#!/usr/bin/bash ARTIST=140308 # 116 is Kasane Teto CHILDREN="true" # If we want child voicebanks, we do so we can get all songs from utau, sv, and sv2 START=0 # Start at the beginning of the recordset. if i wanted to make the file in chunks to use the api less i would use this and max to get the songs in chunks. They say dont use it "thousands of times a day", getting every teto song is 280 times. I think I'm ok. maybe. RESULTS=100 # Max results. Limit is 100. MAX=30000 # when to stop, there's as of 4-23-26 over 28,000 songs featuring Kasane Teto in the recordset i have selected. if [ ! -f dates/${ARTIST}var.json ]; then # var.json has our latest date, we use it to know where to stop going back, past it the songs already exist in the fortune file. echo '{"lastDate": "2000-04-21T00:00:00Z"}' > dates/${ARTIST}var.json # if it doesn't exist, we create it with a default date back in 2000. fi PREVDATE=$(jq -r '.lastDate' dates/${ARTIST}var.json) AFTERDATE=$(date -u -d "$PREVDATE + 1 Second" +"%Y-%m-%dT%H:%M:%SZ") echo "Result: $AFTERDATE" #rm tetofortunes var.json tetofortunes.dat # during testing we will remove everything, or if we want to regenerate the fortune file from scratch. # setting the latest date. just pulling the latest song from the api and setting the createDate as the latest date in var.json for use when we update the fortune file again, dont want to add the same songs twice. idk how I'll handle broken links and such, maybe just regenerate the whole thing periodically. CURLURL="https://vocadb.net/api/songs?songTypes=Original&afterDate=${AFTERDATE}&&artistId%5B%5D=${ARTIST}&childVoicebanks=${CHILDREN}&onlyWithPvs=true&status=Finished&start=0&maxResults=1&sort=PublishDate&fields=PVs" echo "CURLURL: $CURLURL" DATA=$(curl -X 'GET' \ $CURLURL \ -H 'accept: application/json') # making sure there are songs to add. SONGS=$(echo "$DATA" | jq -c '.items | length') if [ "$SONGS" -eq 0 ]; then echo "Result is empty. No more songs." exit 0 fi DATE=$(date -u +%Y-%m-%dT00:00:00Z) echo "DATE: $DATE" echo "{\"lastDate\": \"$DATE\"}" > dates/${ARTIST}var.json # looping the api to get all songs we need. while true; do CURLURL="https://vocadb.net/api/songs?songTypes=Original&afterDate=${AFTERDATE}&&artistId%5B%5D=${ARTIST}&childVoicebanks=${CHILDREN}&onlyWithPvs=true&status=Finished&start=${START}&maxResults=${RESULTS}&sort=PublishDate&fields=PVs" DATA=$(curl -X 'GET' \ $CURLURL \ -H 'accept: application/json') SONGS=$(echo "$DATA" | jq -r '.items | length') if [ "$SONGS" -eq 0 ]; then echo "Result is empty. No more songs." break else START=$((START + SONGS)) echo "Found songs! Processing... (Total fetched: $START)" echo "$DATA" | jq -r '.items[] | [.artistString, .defaultName, .pvs[0].url] | @tsv' | while IFS=$'\t' read -r artist name url; do echo "TETO SONG OF THE DAY!" echo "" echo "$artist -- $name" echo "" echo "$url" echo "" echo "▼・ᴗ・▼" echo "\`" done >> vocafortunes/vocadb/$ARTIST if [ "$START" -ge "$MAX" ]; then echo "Reached max results. Stopping." break fi echo "Done!" fi done readarray -d '`' tetosongs < vocafortunes/vocadb/$ARTIST readarray -td '' dups < <( (( ${#tetosongs[@]} == 0 )) || printf '%s\0' "${tetosongs[@]}" | LC_ALL=C sort -z | LC_ALL=C uniq -zd ) readarray -td '' uniq < <( (( ${#tetosongs[@]} == 0 )) || printf '%s\0' "${tetosongs[@]}" | LC_ALL=C sort -z | LC_ALL=C uniq -zu ) echo ${#tetosongs[@]} if ((${#dups[@]} > 0)); then echo >&2 "array has duplicates:" echo ${#dups[@]} fi if ((${#uniq[@]} > 0)); then echo >&2 "Uniques:" echo ${#uniq[@]} fi printf >&2 '%s' "${dups[@]}" > dups printf >&2 '%s' "${uniq[@]}" > uniq cat uniq > fixed cat dups >> fixed sed -i '1,/^TETO SONG OF THE DAY!/{/^TETO SONG OF THE DAY!$/!d}' fixed rm vocafortunes/vocadb/$ARTIST rm uniq dups mv fixed vocafortunes/vocadb/$ARTIST # create the fortune database from tetofortunes #rm tetofortunes.dat # delete the old database if it extists. #strfile -c % tetofortunes tetofortunes.dat