Do not mistake PC-Axis (PCAXIS) files for text/html

......@@ -117,9 +117,12 @@ def sniff_file_format(filepath, log):
format_ = {'format': 'TTL'}
elif format_['format'] == 'HTML':
# sniffed as HTML - look inside the file to refine the format
with open(filepath) as f:
buf =
# might really be PCAXIS
if is_pcaxis(buf, log):
format_ = {'format': 'PCAXIS'}
# maybe it has RDFa in it
if has_rdfa(buf, log):
format_ = {'format': 'RDFa'}
