# Upgrade the packages that are already installed, answering yes to prompts.
apt-get upgrade -y
# Install the system packages named in the list below.
# NOTE(review): the lines starting with "- " and "+ " look like unresolved
# diff markers (old vs. new tail of the package list, the new one adding
# p7zip-full) -- confirm the intended variant and strip the markers.
apt-get install -y python-pip postgresql python-virtualenv virtualenvwrapper \
git nginx postgresql-server-dev-9.1 libxslt1-dev \
- libxml2-dev libmemcached-dev python-dev rabbitmq-server
+ libxml2-dev libmemcached-dev python-dev rabbitmq-server \
+ p7zip-full
# Create the "vagrant" PostgreSQL role and a "karmaworld" database owned by
# it, by piping the SQL into psql run as the postgres user.
echo "CREATE USER vagrant WITH CREATEROLE LOGIN; CREATE DATABASE karmaworld OWNER vagrant;" | su postgres -c "psql"
Finals Club (c) 2013"""
import os
+import requests
import ConfigParser
+from bs4 import BeautifulSoup as BS
from fabric.api import cd, env, lcd, prefix, run, sudo, task, local, settings
from fabric.contrib import files
env.use_ssh_config = True
+USDE_LINK = "http://ope.ed.gov/accreditation/GetDownloadFile.aspx"
######## Define host(s)
def here():
if errors:
raise Exception('\n'.join(errors))
def fetch_accreditation():
    """
    Connects to USDE accreditation and drops a CSV into confs.

    Fetches the page at USDE_LINK, picks the newest Accreditation zip link
    found on it, downloads that archive to /tmp/accreditation.zip through
    Fabric's ``run`` and extracts its CSV content into
    ``<env.proj_root>/confs/accreditation.csv``, replacing any previous copy.

    Raises:
        requests.HTTPError: the download page answered with an error status.
        IndexError: the page contains no Accreditation zip link.
    """
    # Function-scope imports keep this block self-contained; the fallbacks
    # cover both the Python 2 and Python 3 standard-library layouts.
    try:
        from urlparse import urljoin
    except ImportError:
        from urllib.parse import urljoin
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote

    r = requests.get(USDE_LINK)
    # Raises on 4xx/5xx responses and does nothing otherwise.
    r.raise_for_status()

    # Process the HTML with BeautifulSoup and pull the HREF of every anchor.
    soup = BS(r.text)
    hrefs = (anchor.get('href') for anchor in soup.find_all('a'))
    # Keep only the Accreditation zip links. Anchors without an href yield
    # None, which must be dropped before the substring tests.
    links = [
        href for href in hrefs
        if href and 'Accreditation' in href and 'zip' in href
    ]
    if not links:
        # Same exception type the former sorted(...)[-1] lookup produced,
        # but with a message that says what actually went wrong.
        raise IndexError(
            'No Accreditation zip link found at {0}'.format(USDE_LINK))

    # Find the most recent. (Accreditation_YYYY_MM.zip means alphanumeric sort)
    newest = max(links)
    # The page may use relative links. wget's -B option only applies to
    # links read from an input file, so make the URL absolute here instead.
    link = urljoin(USDE_LINK, newest)

    # Download the linked file to the FS and extract the CSV.
    tempfile = '/tmp/accreditation.zip'
    csvfile = env.proj_root + '/confs/accreditation.csv'
    # The link comes from a remote page, so quote it before it reaches the
    # shell.
    run('wget -O {0} {1}'.format(quote(tempfile), quote(link)))
    # Overwrite rather than append so repeated runs do not duplicate rows.
    run("7z e -i'!*.csv' -so {0} > {1}".format(
        quote(tempfile), quote(csvfile)))
def first_deploy():