-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathfetch.py
More file actions
145 lines (111 loc) · 5.79 KB
/
fetch.py
File metadata and controls
145 lines (111 loc) · 5.79 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
# -*- coding: utf-8 -*-
import urllib
from datetime import datetime, timedelta
import os
from settings import TILE_SERVER, TILE_FOLDER, GFS_FOLDER
from utils import logger
"""
This is the code that serves to download the raw precipitation data.
Run it as such: python fetch.py
It tries to find the most recent GRIB file as available from the
Global Forecast System.
No dependencies outside the Python Standard Library
"""
class AppURLopener(urllib.FancyURLopener):
    # Spoof a browser User-Agent: some tile/data servers refuse requests
    # that arrive with the default "Python-urllib/x.y" agent string.
    # NOTE(review): urllib.FancyURLopener and the _urlopener hook below are
    # Python 2 only; this module will not run unmodified under Python 3.
    version = 'Mozilla/5.0'

# Install our opener as the module-global default so that plain
# urllib.urlretrieve()/urlopen() calls below pick up the spoofed agent.
urllib._urlopener = AppURLopener()
def fetch_owm():
    """
    Download the latest precipitation tiles from OpenWeatherMap.

    At zoom level 4, there are 4² × 4² = 16 × 16 = 256 tiles.

    We don’t actually use OpenWeatherMap anymore in the application.
    However, the code is still useful to download tiles from any map
    that follows the conventions laid out by OpenStreetMap:
    We used a variation of this code to download the tiles from the
    Stamen black & white map we used cached in the application.

    Tiles are written to TILE_FOLDER/<hour-timestamp>/<z>/<x>/<y>.png.
    """
    z = 4  # zoom level: the map is 2**z tiles wide and 2**z tiles high

    def quantisised_time():
        """
        ISO representation of datetime rounded to nearest hour.
        To use for folder names etcetera.
        """
        return datetime.now().strftime("%Y-%m-%dT%H:00:00Z")

    # Evaluate the timestamp ONCE, before the loop: the original code called
    # quantisised_time() per tile, so a run that crossed an hour boundary
    # scattered its tiles over two different timestamp folders.
    stamp = quantisised_time()

    for x in range(2 ** z):
        for y in range(2 ** z):
            uri = TILE_SERVER.format(s='a', z=z, x=x, y=y)
            # make a folder like raduga_tiles/<timestamp>/4/5/
            path = os.path.join(TILE_FOLDER, stamp, str(z), str(x))
            try:
                os.makedirs(path)
            except OSError:
                # Already created (by a previous y, or concurrently) —
                # avoids the exists()/makedirs() race of the original.
                pass
            output_file = os.path.join(path, '%s.png' % y)
            urllib.urlretrieve(uri, output_file)
def fetch_gfs():
    """
    Download the latest weather forecast from the Global Forecast System.

    There are some 300 different tables in the GFS data, so we ask it to be
    filtered for Precipitable Water (PWAT), the information that interests us.

    The GFS data is produced every six hours. It contains information about
    the current weather situation and for 3, 6, 9, 12 etc. hours into
    the future. Because the GFS is not immediately available (in general
    several hours after the time indicated as ‘now’), we use the predictions
    of 6 hours and 9 hours into the future. This way we have a time point for
    every 3 hours.

    Writes GFS_FOLDER/<slug>/GFS_half_degree.<slug>.pwat.grib for the
    6-hour and 9-hour forecasts of the newest available model run.
    """
    six_hours = timedelta(hours=6)
    nine_hours = timedelta(hours=9)

    d = datetime.utcnow()
    # Possible values for hour: [0, 6, 12, 18].
    # Floor division (//) rounds down to the previous model run; the
    # original used "/", which silently breaks under Python 3 (or
    # `from __future__ import division`) by producing a float hour.
    d_rounded = d.replace(hour=d.hour // 6 * 6)

    res6, res9 = None, None
    # If we don’t find the latest forecast we go back six hours at a time
    # until we hit a run that does exist (or one we already downloaded).
    # Bounded (20 steps = 5 days) so a misbehaving server can never trap
    # the original `while True` in an infinite loop.
    for _attempt in range(20):
        res6, res9 = None, None
        logger.debug("rounding %s hours UTC at %s to %s hours UTC at %s" %
                     (d.strftime("%H"), d.strftime("%d"), d_rounded.strftime("%H"), d_rounded.strftime("%d")))
        d6 = d_rounded + six_hours
        d9 = d_rounded + nine_hours
        slug = d_rounded.strftime("%Y%m%d%H")  # '2014040812'
        slug6 = d6.strftime("%Y%m%d%H")        # '2014040818'
        slug9 = d9.strftime("%Y%m%d%H")        # '2014040821'
        target_folder6 = os.path.join(GFS_FOLDER, slug6)
        target_folder9 = os.path.join(GFS_FOLDER, slug9)
        output_file6 = os.path.join(target_folder6, "GFS_half_degree.%s.pwat.grib" % slug6)
        output_file9 = os.path.join(target_folder9, "GFS_half_degree.%s.pwat.grib" % slug9)

        if os.path.exists(output_file9):
            # There is no need to continue looking, as we have this file already,
            # and apparently it is the most recent forecast.
            logger.debug("file %s exists already" % output_file9)
            break

        # We get forecasts for 6 and 9 hours later.
        # NOTE(review): the filter_gfs_hd.pl endpoint is the historical NOMADS
        # half-degree filter service — confirm it is still the correct URL.
        uri6 = "http://nomads.ncep.noaa.gov/cgi-bin/filter_gfs_hd.pl?file=gfs.t" + d_rounded.strftime("%H") + "z.mastergrb2f06&lev_entire_atmosphere_%5C%28considered_as_a_single_layer%5C%29=on&var_PWAT=on&leftlon=0&rightlon=360&toplat=90&bottomlat=-90&dir=%2Fgfs." + slug + "%2Fmaster"
        uri9 = "http://nomads.ncep.noaa.gov/cgi-bin/filter_gfs_hd.pl?file=gfs.t" + d_rounded.strftime("%H") + "z.mastergrb2f09&lev_entire_atmosphere_%5C%28considered_as_a_single_layer%5C%29=on&var_PWAT=on&leftlon=0&rightlon=360&toplat=90&bottomlat=-90&dir=%2Fgfs." + slug + "%2Fmaster"

        logger.debug("retrieving file %s" % uri9)
        res9 = urllib.urlopen(uri9)
        c = res9.getcode()
        if c == 200:
            logger.debug("retrieving file %s" % uri6)
            res6 = urllib.urlopen(uri6)
            if res6.getcode() != 200:
                # The original wrote this response to disk unchecked, so a
                # 404/error page could be saved as a .grib file.
                logger.debug("uri %s failed with error code %s" % (uri6, res6.getcode()))
                res6 = None
            break
        if c == 404:
            logger.debug("uri %s not available (yet)" % uri9)
        else:
            logger.debug("uri %s failed with error code %s" % (uri9, c))
        res9 = None
        d_rounded = d_rounded - six_hours

    # Only write when BOTH forecasts were fetched successfully.
    if res9 and res6:
        for target_folder in [target_folder9, target_folder6]:
            if not os.path.exists(target_folder):
                os.makedirs(target_folder)
        with open(output_file6, 'wb') as f:
            logger.debug("writing file %s" % output_file6)
            f.write(res6.read())
        with open(output_file9, 'wb') as f:
            logger.debug("writing file %s" % output_file9)
            f.write(res9.read())
if __name__ == '__main__':
    # Script entry point: only the GFS download runs; fetch_owm is kept in
    # the module for reference (see its docstring) but is not invoked.
    fetch_gfs()