ISNI
VIAF
wget 'http://viaf.org/viaf/data/viaf-20170906-links.txt.gz'  # saves viaf-20170906-links.txt.gz into the current directory
make smaller (recompress the gzip file as bzip2)
gzip -dc viaf-20170906-links.txt.gz | bzip2 -c > viaf-20170906-links.txt.bz2  # stream gzip -> bzip2; the .gz file is left untouched
extract uncompressed file (keep original compressed file)
gzip -dc viaf-20170906-links.txt.gz > viaf-20170906-links.txt  # -c writes to stdout, so the .gz file is not removed
see sizes
ls -la
-rw-r--r-- 1 root root 4440512262 Sep 21 11:44 viaf-20170906-links.txt
-rw-r--r-- 1 root root  666148170 Sep 21 11:28 viaf-20170906-links.txt.bz2
-rw-r--r-- 1 root root  814025893 Sep  7 10:36 viaf-20170906-links.txt.gz
view data (first 100 lines)
gzip -dc viaf-20170906-links.txt.gz | head -n 100  # peek at the first 100 lines without unpacking to disk
extract lines that contain "ISNI"
zcat viaf-20170906-links.txt.gz | grep -F 'ISNI' > viaf-20170906-links.isni.txt  # grep -F = fixed-string match; replaces the obsolescent fgrep
remove VIAF and ISNI prefixes and sort by ISNI
zcat viaf-20170906-links.txt.gz |
  grep -F 'ISNI' |                                        # keep only lines containing the fixed string ISNI (fgrep is obsolescent)
  sed -e 's@http://viaf\.org/viaf/@@' -e 's/ISNI|//' |    # drop the VIAF URL prefix (dots escaped to match literally) and the "ISNI|" tag
  sort -k2 |                                              # sort key starts at the second whitespace-separated field (the ISNI)
  gzip > viaf-20170906-links.isni-noprefix.sortbyisni.txt.gz