# Unset the `text` attribute for the file types below so Git performs no
# end-of-line conversion on them and stores their bytes exactly as committed.
# NOTE(review): presumably these are web-archive records and their indexes,
# where byte offsets must stay stable -- confirm against the project's usage.
#
# gitattributes syntax is one pattern per line, followed by its attributes;
# several patterns on a single line would be misread as attribute names.
*.arc   -text
*.warc  -text
*.idx   -text
*.idxj  -text
*.cdx   -text
*.cdxj  -text
*.gz    -text