Difference between revisions of "User:Andreas Plank/Useful Scripts (Linux)"

From CETAF Identifiers Wiki
Jump to: navigation, search
m (+ links)
m (:: => » :: «)
Line 39: Line 39:
 
   # parse multiple files and concatenate the { items : [] }
 
   # parse multiple files and concatenate the { items : [] }
  
   jq '.items|=sort_by(.name)|.items [] | (.id + "::" + .name + "::" + .links[0])' ror.org_page-all.json
+
   jq '.items|=sort_by(.name)|.items [] | (.id + " :: " + .name + " :: " + .links[0])' ror.org_page-all.json
 
   # find in { items : [ {id : … , name : … , links : [ ] }] } and concatenate them via "::"
 
   # find in { items : [ {id : … , name : … , links : [ ] }] } and concatenate them via "::"
 
else
 
else
Line 45: Line 45:
 
fi
 
fi
 
# #### result list
 
# #### result list
# "https://ror.org/02ya7hp91::ALZHIR Museum and Memorial Complex::https://museum-alzhir.kz/en"
+
# "https://ror.org/02ya7hp91 :: ALZHIR Museum and Memorial Complex :: https://museum-alzhir.kz/en"
# "https://ror.org/02pvtxb60::ASTRA National Museum Complex::http://www.muzeulastra.ro/"
+
# "https://ror.org/02pvtxb60 :: ASTRA National Museum Complex :: http://www.muzeulastra.ro/"
 
# …
 
# …
# "https://ror.org/00bv4cx53::Botanischer Garten und Botanisches Museum Berlin::https://www.bgbm.org/"
+
# "https://ror.org/00bv4cx53 :: Botanischer Garten und Botanisches Museum Berlin :: https://www.bgbm.org/"
 
# …
 
# …
# "https://ror.org/01h1jbk91::Meise Botanic Garden::https://www.plantentuinmeise.be/en/"
+
# "https://ror.org/01h1jbk91 :: Meise Botanic Garden :: https://www.plantentuinmeise.be/en/"
 
# …
 
# …
# "https://ror.org/03wkt5x30::National Museum of Natural History::http://www.mnhn.fr/fr"
+
# "https://ror.org/03wkt5x30 :: National Museum of Natural History :: http://www.mnhn.fr/fr"
 
# …
 
# …
# "https://ror.org/0349vqz63::Royal Botanic Garden Edinburgh::http://www.rbge.org.uk/"
+
# "https://ror.org/0349vqz63 :: Royal Botanic Garden Edinburgh :: http://www.rbge.org.uk/"
 
# …
 
# …
# "https://ror.org/03pjnvf85::Zürich Zoological Garden::https://www.zoo.ch/"
+
# "https://ror.org/03pjnvf85 :: Zürich Zoological Garden :: https://www.zoo.ch/"
 
# …
 
# …
 
# ##############################################
 
# ##############################################
 
</syntaxhighlight>
 
</syntaxhighlight>

Revision as of 10:04, 1 July 2020

Get IDs of api.ror.org by Query

# ##############################################
# dependency: curl
# dependency: jq (JSON tool)
# dependency: awk
# get from exact query

# #### returned JSON
# { 
#   "number_of_results": 1,
#   "time_taken": 41,
#   "items": [
#     {
#       "id": "https://ror.org/00bv4cx53",
#       "name": "Botanischer Garten und Botanisches Museum Berlin",
#       "types": [
#         "Archive"
#   …
# }

# #### one entry by exact query phrase
curl -G https://api.ror.org/organizations --data-urlencode 'query="Botanischer Garten und Botanisches Museum Berlin"' | jq . > bgbm.org.json
jq '.items|=sort_by(.name)|.items [] | (.id + "::" + .name)' bgbm.org.json 
# "https://ror.org/00bv4cx53::Botanischer Garten und Botanisches Museum Berlin"

# #### get from multiple result pages
query_string="Botanisch Garten garden botanical"
number_of_results=`curl --silent --get https://api.ror.org/organizations --data-urlencode "query=$query_string" | jq ".number_of_results"`
number_of_pages=`echo "scale=0; ${number_of_results}/20 + 0.5" | bc -l | awk '{printf("%d\n",$1 + 0.5)}'`
if [[ "$number_of_pages" =~ ^[0-9]+$ ]]; then
  for ((p=1; p<=$number_of_pages; p++)); do
  echo "# get content of page $p => ror.org_page-$p.json"
    contents=$(curl --silent --get https://api.ror.org/organizations --data-urlencode "query=$query_string" --data-urlencode "page=$p" )
    echo "$contents" > "ror.org_page-$p.json"
  done
  jq --slurp '{ items: map(.items[]) }' ror.org_page-*.json > ror.org_page-all.json
  # parse multiple files and concatenate the { items : [] }

  jq '.items|=sort_by(.name)|.items [] | (.id + " :: " + .name + " :: " + .links[0])' ror.org_page-all.json
  # find in { items : [ {id : … , name : … , links : [ ] }] } and concatenate them via "::"
else
  echo "Something wrong: \$number_of_pages is not an integer ()"
fi
# #### result list
# "https://ror.org/02ya7hp91 :: ALZHIR Museum and Memorial Complex :: https://museum-alzhir.kz/en"
# "https://ror.org/02pvtxb60 :: ASTRA National Museum Complex :: http://www.muzeulastra.ro/"
# …
# "https://ror.org/00bv4cx53 :: Botanischer Garten und Botanisches Museum Berlin :: https://www.bgbm.org/"
# …
# "https://ror.org/01h1jbk91 :: Meise Botanic Garden :: https://www.plantentuinmeise.be/en/"
# …
# "https://ror.org/03wkt5x30 :: National Museum of Natural History :: http://www.mnhn.fr/fr"
# …
# "https://ror.org/0349vqz63 :: Royal Botanic Garden Edinburgh :: http://www.rbge.org.uk/"
# …
# "https://ror.org/03pjnvf85 :: Zürich Zoological Garden :: https://www.zoo.ch/"
# …
# ##############################################