summaryrefslogtreecommitdiff
path: root/unpack-pubmed
blob: a671512627ecdc3b5017e4854120e1e33de07aaf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#!/bin/sh

# Value forwarded to xtract's -flags option: the first command-line
# argument when one was supplied (even an empty one), otherwise "none".
flags=${1-none}

# For every "<base>.xml.gz" in the current directory, decompress it and pipe
# it through xtract, storing the result as "<base>.xml". "<base>.uid" is
# handed to xtract's -unique option. Archives whose "<base>.xml" already
# exists are skipped, so the script can be re-run to pick up where it left off.
for fl in *.xml.gz
do
  # With no matching archives POSIX sh leaves the pattern unexpanded; skip
  # the literal "*.xml.gz" rather than creating a bogus "*.xml" output file.
  [ -e "$fl" ] || continue

  base=${fl%.xml.gz}
  if [ -f "$base.xml" ]
  then
    continue
  fi
  echo "$fl"

  # Write to a scratch name first and rename only on success. Otherwise a
  # failed or interrupted run would leave a truncated "$base.xml" behind,
  # and the existence check above would skip it on every later run.
  part="$base.xml.part"

  # NOTE: plain sh has no pipefail, so the status tested here is xtract's
  # (the last command in the pipeline), not gunzip's.
  if gunzip -c "$fl" | xtract -flags "$flags" -unique "$base.uid" -index MedlineCitation/PMID \
    -head "<PubmedArticleSet>" -tail "</PubmedArticleSet>" -pattern PubmedArticle > "$part"
  then
    mv -f "$part" "$base.xml"
  else
    echo "$fl: extraction failed, no $base.xml written" >&2
    rm -f "$part"
  fi
done