Browse Source

Add support for WARC/1.1

master
JustAnotherArchivist 4 years ago
parent
commit
c13a1150df
1 changed file with 1 addition and 1 deletion
  1. +1
    -1
      warc-tiny

+ 1
- 1
warc-tiny View File

@@ -102,7 +102,7 @@ def iter_warc(f):
if not buf:
break
warcHeaderBuf, buf = buf.split(b'\r\n\r\n', 1)
- assert warcHeaderBuf.startswith(b'WARC/1.0\r\n')
+ assert warcHeaderBuf.startswith(b'WARC/1.0\r\n') or warcHeaderBuf.startswith(b'WARC/1.1\r\n')
assert b'\r\nContent-Length:' in warcHeaderBuf
warcHeaders = tuple(tuple(map(bytes.strip, x.split(b':', 1))) for x in warcHeaderBuf.split(b'\r\n'))
warcContentType = next(x[1] for x in warcHeaders if x[0] == b'Content-Type')


Loading…
Cancel
Save