canteen-info

scrape weekly menus from canteens surrounding Aarhus University
git clone git://src.adamsgaard.dk/canteen-info # fast
git clone https://src.adamsgaard.dk/canteen-info.git # slow
Log | Files | Refs | README | LICENSE Back to index

matkant (478B)


      1 #!/bin/bash
      2 set -e
      3 
      4 # requires html2text package
      5 
      6 tmpfile=/tmp/matkant.html
      7 page=http://www.matkant.dk/dagmenu.php
      8 
      9 wget $page -O $tmpfile --quiet
     10 
     11 html2text $tmpfile > $tmpfile.txt
     12 
     13 cat $tmpfile.txt |\
     14     sed -n '/\* Mandag\|\* Tirsdag\|\* Onsdag\|\* Torsdag\|\* Fredag/,$p' |\
     15     #sed 's/XHTML.*//' |\
     16     #sed -n '/.*Mandag\|.*Tirsdag\|.*Onsdag\|.*Torsdag\|.*Fredag\|.*Lørdag\|.*Søndag/q;p' |\
     17     sed -n '/.*Lørdag/q;p' |\
     18     grep -v '^$'
     19 
     20 rm $tmpfile
     21 rm $tmpfile.txt