commands.txt (1040B)
1 # Here are the raw operations that were used to process the data 2 # Note that the registration file is not versioned here because it contains 3 # personal information 4 5 - select the right columns in LibreOffice 6 - replace the newlines in LibreOffice 7 - cat high2025_orders_2025_08_29_filter.csv| grep '^paid;' | grep -v "Online only ticket" | cut -d';' -f2,3,4,6- > onsites.csv 8 - checked that the statuses other than "paid" look bad 9 - checked that the prices paid make sense 10 - checked that there are no duplicates 11 - eliminate local participants, yielding onsites_anon_nolocal.csv 12 - manually complete locations, yielding onsites_anon_nolocal_completed.csv 13 - cut -d';' -f7-12 onsites_anon_nolocal_completed.csv > location_mode_extension.csv 14 - cat location_mode_extension.csv| cut -d';' -f1 > locations.txt 15 - cat location_mode_extension.csv| cut -d';' -f3 >> locations.txt 16 - cat locations.txt| sort | uniq > locations_uniq.txt 17 18 cat <(yes 0 | head -28) <(cat footprints.txt | sort -n | awk '{s+= $0; print s}') > footprints_withlocal_cumul.txt