new things
This commit is contained in:
16
pdf2bib.sh
16
pdf2bib.sh
@@ -31,13 +31,25 @@ echo "using $bibdFileOut"
|
||||
|
||||
# Try to extract the DOI from the PDF and retrieve a PubMed ID
|
||||
#for 'DOI:' syntax
|
||||
# Older 'DOI:' extraction: take the first line of page 1 that contains "doi:"
# (case-insensitive), lowercase it, and let sed drop the "doi:" label.
# "$fn" and the tr character classes are quoted so that a path containing
# spaces, or a one-letter filename in the working directory, cannot change
# the command that actually runs.
# NOTE(review): the next doi= assignment overwrites this value unconditionally
# -- confirm whether this line is still needed.
doi=$(pdftotext -q -f 1 -l 1 "$fn" - | grep -i "doi:" --max-count=1 | tr '[:upper:]' '[:lower:]' | sed -E "s#doi:(.+)#\1#")
|
||||
# doi=$(pdftotext -q -f 1 -l 1 $fn - | grep -i "doi:" --max-count=1 | tr [:upper:] [:lower:] | sed -E "s#doi:(.+)#\1#")
|
||||
|
||||
# Take the first line of page 1 that holds a DOI label followed by a "10."
# prefix ("doi:10.", "doi: 10.", "doi 10.", "doi/10.", ...), lowercase it, and
# keep everything from the "10" onward.
# "$fn" and the tr character classes are quoted so that a path containing
# spaces, or a one-letter filename in the working directory, cannot change
# the command that actually runs.
doi=$(pdftotext -q -f 1 -l 1 "$fn" - | grep -iE "doi:? ?/?10\." --max-count=1 | tr '[:upper:]' '[:lower:]' | sed -E "s#.*doi:? ?/?(10.+)#\1#")
|
||||
|
||||
|
||||
#for 'https://doi.org' syntax
|
||||
if [ -z "$doi" ]; then
|
||||
# Older URL-style fallback: first line of page 1 containing "doi.org/"
# (case-insensitive), lowercased, with everything up to and including
# "doi.org/" removed by sed.
# "$fn" and the tr character classes are quoted so that a path containing
# spaces, or a one-letter filename in the working directory, cannot change
# the command that actually runs.
# NOTE(review): the doi= assignment that follows inside this same `if`
# overwrites this value -- confirm whether this line is still needed.
doi=$(pdftotext -q -f 1 -l 1 "$fn" - | grep -i "doi.org/" --max-count=1 | tr '[:upper:]' '[:lower:]' | sed -E "s#.+doi\.org\/(.+)#\1#")
|
||||
# URL-style fallback: first line of page 1 containing "doi.org/10."
# (case-insensitive), lowercased, keeping only the part that starts at "10".
# The sed prefix is ".*" rather than ".+" so a line that *begins* with
# "doi.org/10..." is stripped as well, instead of being passed through whole.
# "$fn" and the tr character classes are quoted so that a path containing
# spaces, or a one-letter filename in the working directory, cannot change
# the command that actually runs.
doi=$(pdftotext -q -f 1 -l 1 "$fn" - | grep -iE "doi\.org/10\." --max-count=1 | tr '[:upper:]' '[:lower:]' | sed -E "s#.*doi\.org/(10.+)#\1#")
|
||||
fi
|
||||
|
||||
# for 'https://doi.org' syntax
|
||||
# if [ -z "$doi" ]; then
|
||||
# doi=$(pdftotext -q -f 1 -l 1 $fn - | grep -i "doi.org/" --max-count=1 | tr [:upper:] [:lower:] | sed -E "s#.+doi\.org\/(.+)#\1#")
|
||||
# fi
|
||||
#
|
||||
# if [ -z "$doi" ]; then
|
||||
# doi=$(pdftotext -q -f 1 -l 1 $fn - | grep -iE "doi ?" --max-count=1 | tr [:upper:] [:lower:] | sed -E "s#doi ?(.+)#\1#")
|
||||
# fi
|
||||
|
||||
if [ -z "$doi" ]; then
|
||||
echo "doi not found"
|
||||
exit 1
|
||||
|
||||
Reference in New Issue
Block a user