Blame view

web/run.py 57.9 KB
bde97e4d   Goutte   Add more changes ...
1
2
# coding=utf-8

9390ec89   Goutte   Initial experimen...
3
import StringIO
bc18b96c   Goutte   Implement first (...
4
import datetime
8644387c   Goutte   Use real data.
5
import gzip
bc18b96c   Goutte   Implement first (...
6
7
8
import json
import logging
import random
2fedd73b   Goutte   Initial implement...
9
import tarfile
bde97e4d   Goutte   Add more changes ...
10
import time
8644387c   Goutte   Use real data.
11
import urllib
9f57dceb   Goutte   Add half the brid...
12
import requests
11d86851   Goutte   Add support for s...
13
import re  # regex
9f57dceb   Goutte   Add half the brid...
14

11d86851   Goutte   Add support for s...
15
from csv import writer as csv_writer, DictWriter as csv_dict_writer
596da00d   Goutte   Add more exceptio...
16
from math import sqrt, isnan
bc18b96c   Goutte   Implement first (...
17
18
19
from os import environ, remove as removefile
from os.path import isfile, join, abspath, dirname

fb383448   Goutte   Implement the cac...
20
from dateutil.relativedelta import relativedelta
9390ec89   Goutte   Initial experimen...
21
from flask import Flask
9390ec89   Goutte   Initial experimen...
22
from flask import request
bc18b96c   Goutte   Implement first (...
23
from flask import url_for, send_from_directory, abort as abort_flask
bde97e4d   Goutte   Add more changes ...
24
from jinja2 import Environment, FileSystemLoader, Markup
bc18b96c   Goutte   Implement first (...
25
from yaml import load as yaml_load
f10f34d1   Goutte   More logic.
26
from netCDF4 import Dataset, date2num
9390ec89   Goutte   Initial experimen...
27

dabb9d5f   Goutte   Fix the layers' c...
28

9390ec89   Goutte   Initial experimen...
29
30
31
32
33
34
# PATH RELATIVITY #############################################################

THIS_DIRECTORY = dirname(abspath(__file__))


def get_path(relative_path):
    """
    Get an absolute path from the relative path to this script directory.

    :param relative_path: path expressed relatively to the directory that
                          holds this file (THIS_DIRECTORY)
    :return: the matching absolute, normalized path
    """
    return abspath(join(THIS_DIRECTORY, relative_path))


# COLLECT GLOBAL INFORMATION FROM SOURCES #####################################

# VERSION
# The version is the whitespace-stripped content of the `VERSION` file that
# sits one directory above this script.
with open(get_path('../VERSION'), 'r') as version_file:
    version = version_file.read().strip()

# CONFIG
# The whole application configuration is parsed from `config.yml`, which also
# sits one directory above this script.
# NOTE(review): `yaml.load` is called here without an explicit `Loader`.
# Recent PyYAML releases deprecate (5.1+) or reject (6.0+) that form, and the
# default loader must never be fed untrusted YAML. Consider `yaml.safe_load`.
with open(get_path('../config.yml'), 'r') as config_file:
    config = yaml_load(config_file.read())

c0df94bc   Goutte   Adding more logs.
49
# strftime/strptime patterns of the date notations used by this application.
FILE_DATE_FMT = "%Y-%m-%dT%H:%M:%S"
MOMENT_DATE_FMT = "%Y-%m-%dT%H:%M:%SZ"
CME_DATE_FMT = "%Y-%m-%dT%H:%MZ"

# Are we on the SSA instance for ESA?
SSA = environ.get('SSA') == 'true'
# Debug mode is enabled when the environment defines DEBUG=true.
DEBUG = environ.get('DEBUG') == 'true'
# SSA = True
9390ec89   Goutte   Initial experimen...
57

f75faf5f   Goutte   WIP
58
59
# LOGGING #####################################################################

1324cc91   Goutte   Make the footer i...
60
61
# The log file sits next to this script.
LOG_FILE = get_path('run.log')

log = logging.getLogger("HelioPropa")
# Everything is logged in debug mode, only errors (and worse) otherwise.
if DEBUG:
    log.setLevel(logging.DEBUG)
else:
    log.setLevel(logging.ERROR)
logHandler = logging.FileHandler(LOG_FILE)
logHandler.setFormatter(logging.Formatter(
    "%(asctime)s - %(levelname)s - %(message)s"
))
log.addHandler(logHandler)
f75faf5f   Goutte   WIP
72
73


e18701b6   Goutte   Cache clear (remo...
74
75
# HARDCODED CONFIGURATION #####################################################

a2034dd9   Goutte   Convert from kilo...
76
77
# Length of one astronomical unit, in kilometers.
ASTRONOMICAL_UNIT_IN_KM = 1.496e8

# Absolute path to the installed CDF library from https://cdf.gsfc.nasa.gov/
CDF_LIB = '/usr/local/lib/libcdf'

# Absolute path to the data cache directory
CACHE_DIR = get_path('../cache')

# These two configs are not in the YAML config because adding a new parameter
# will not work as-is, you'd have to edit some netcdf-related code.

# The slugs of the available parameters in the generated CSV files.
# The order matters. If you change this you also need to change the
# innermost loop of `get_data_for_target`.
# The javascript knows the targets' properties under these names.
PROPERTIES = ('time', 'vrad', 'vtan', 'vtot', 'btan', 'temp', 'pdyn', 'dens',
              'atse', 'xhee', 'yhee')

# The parameters that the users can handle.
# The slug MUST be one of the properties above.
PARAMETERS = {
    'pdyn': {
        'slug': 'pdyn',
        'name': 'Dyn. Pressure',
        'title': 'The dynamic pressure.',
        'units': 'nPa',
        'active': True,
        'position': 10,
    },
    'vtot': {
        'slug': 'vtot',
        'name': 'Velocity',
        'title': 'The velocity of the particles.',
        'units': 'km/s',
        'active': False,
        'position': 20,
    },
    'btan': {
        'slug': 'btan',
        'name': 'B Tangential',
        'title': 'B Tangential.',
        'units': 'nT',
        'active': False,
        'position': 30,
    },
    'temp': {
        'slug': 'temp',
        'name': 'Temperature',
        'title': 'The temperature.',
        'units': 'eV',
        'active': False,
        'position': 40,
    },
    'dens': {
        'slug': 'dens',
        'name': 'Density',
        'title': 'The density N.',
        'units': 'cm^-3',
        'active': False,
        'position': 50,
    },
    'atse': {
        'slug': 'atse',
        'name': 'Angle T-S-E',
        'title': 'Angle Target-Sun-Earth.',
        'units': 'deg',
        'active': False,
        'position': 60,
    },
}


48fa6323   Goutte   Try to fix the he...
148
# SETUP ENVIRONMENT ###########################################################
2fe06b17   Goutte   Move the ENV dire...
149
150
151
152
153

# Export both locations through the process environment in a single call.
environ.update(SPACEPY=CACHE_DIR, CDF_LIB=CDF_LIB)


9390ec89   Goutte   Initial experimen...
154
155
156
# SETUP FLASK ENGINE ##########################################################

app = Flask(__name__, root_path=THIS_DIRECTORY)
app.debug = DEBUG
# NOTE: `log` only records errors when DEBUG is off, so the second message
# below does not reach the log file in that case.
if app.debug:
    log.info("Starting Flask app IN DEBUG MODE...")
else:
    log.info("Starting Flask app...")
9390ec89   Goutte   Initial experimen...
162
163


48fa6323   Goutte   Try to fix the he...
164
165
166
167
def handle_error(e):
    """
    Log any exception raised while handling a request, and answer with its
    message as the response body.

    The status code carried by the exception (werkzeug's HTTP exceptions
    expose it as `code`) is preserved. Anything else is answered as a 500,
    instead of a misleading 200.

    :param e: the exception that was raised
    :return: a (body, status code) tuple, which Flask turns into a response
    """
    log.error(e)
    status = getattr(e, 'code', None)
    # Only trust `code` when it looks like an HTTP error status.
    if not isinstance(status, int) or not 400 <= status < 600:
        status = 500
    return str(e), status  # wish we could use the default error renderer here


app.register_error_handler(Exception, handle_error)


9390ec89   Goutte   Initial experimen...
172
173
174
175
176
177
178
179
180
# SETUP JINJA2 TEMPLATE ENGINE ################################################

def static_global(filename):
    """
    Build the URL of a static asset.
    Exposed to the templates as the `static` global.

    :param filename: passed as `filename` to the `static` endpoint
    :return: whatever `url_for` builds for that endpoint
    """
    return url_for('static', filename=filename)


def shuffle_filter(seq):
    """
    This shuffles the sequence it is applied to.
    Jinja2 _should_ provide this.

    The input is never modified: a shuffled list copy is returned.

    :param seq: any iterable
    :return: a new list holding the elements of [seq] in random order,
             or [seq] itself, untouched, when it cannot be turned into a list
    """
    try:
        result = list(seq)
    except Exception:
        # Best effort: a template filter should not break the whole page.
        # Unlike a bare `except`, this lets KeyboardInterrupt and SystemExit
        # through.
        return seq
    random.shuffle(result)
    return result


def markdown_filter(value, nl2br=False, p=True):
    """
    Converts markdown into html.

    :param value: the markdown source
    :param nl2br: set to True to replace line breaks with <br> tags
    :param p: set to False to remove the enclosing <p></p> tags
    :return: the HTML5 output of the markdown renderer
    """
    from markdown import markdown
    from markdown.extensions.abbr import AbbrExtension
    from markdown.extensions.nl2br import Nl2BrExtension

    enabled = [AbbrExtension()]
    # Both flags are compared by identity, so only actual booleans toggle them.
    if nl2br is True:
        enabled.append(Nl2BrExtension())
    html = markdown(value, output_format='html5', extensions=enabled)
    if p is not False:
        return html
    # Every <p> and </p> tag of the output is dropped.
    return html.replace(r"<p>", "").replace(r"</p>", "")


bde97e4d   Goutte   Add more changes ...
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
# Maps the characters that are unsafe inside a javascript string literal to
# their \uXXXX escape sequence.
_js_escapes = {
    '\\': '\\u005C',
    '\'': '\\u0027',
    '"': '\\u0022',
    '>': '\\u003E',
    '<': '\\u003C',
    '&': '\\u0026',
    '=': '\\u003D',
    '-': '\\u002D',
    ';': '\\u003B',
    u'\u2028': '\\u2028',
    u'\u2029': '\\u2029',
}
# Escape every ASCII character with a value less than 32.
# `range` (not `xrange`) keeps this working on both Python 2 and Python 3.
_js_escapes.update(('%c' % z, '\\u%04X' % z) for z in range(32))


def escapejs_filter(value):
    """
    Escape [value] so that it can be written inside a javascript string.

    Each character found in `_js_escapes` is swapped for its \\uXXXX escape
    sequence; all the others are kept as they are.

    :param value: the text to escape
    :return: the escaped text, wrapped in `Markup`
    """
    return Markup("".join(_js_escapes.get(char, char) for char in value))

9390ec89   Goutte   Initial experimen...
236
237
238
239
240
241
242
243
244
245
246
247
# Templates are loaded from the `view` directory next to this script.
tpl_engine = Environment(loader=FileSystemLoader([get_path('view')]),
                         trim_blocks=True,
                         lstrip_blocks=True)

# Functions the templates can call.
tpl_engine.globals.update(
    url_for=url_for,
    static=static_global,
)

# Custom filters (`md` is an alias of `markdown`).
tpl_engine.filters['markdown'] = markdown_filter
tpl_engine.filters['md'] = markdown_filter
tpl_engine.filters['shuffle'] = shuffle_filter
tpl_engine.filters['escapejs'] = escapejs_filter
9390ec89   Goutte   Initial experimen...
249
250
251
252
253
254

# Variables made available to every template rendered by `render_view`.
tpl_global_vars = {
    'request': request,
    'version': version,
    'config': config,
    # NOTE: evaluated only once, when this module is imported.
    'now': datetime.datetime.now(),
    'is_esa': SSA,
}


# HELPERS #####################################################################

57f42bd7   Goutte   Log the abortions.
261
def abort(code, message):
    """
    Log the abortion as an error, and then abort the request using flask.

    :param code: HTTP status code handed to flask's `abort`
    :param message: description handed to flask's `abort`, and logged
    """
    # %-style arguments: logging must not fail when message is not a string.
    log.error("Abort: %s", message)
    abort_flask(code, message)


9390ec89   Goutte   Initial experimen...
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
def render_view(view, context=None):
    """
    A simple helper to render [view] template with [context] vars.
    It automatically adds the global template vars defined above, too.
    It returns a string, usually the HTML contents to display.

    :param view: name of the template, as known by the template engine
    :param context: optional dict of variables for the template.
                    They take precedence over the global template vars.
                    This dict is not modified.
    :return: the rendered template
    """
    # Copy-and-update works the same on Python 2 and 3, whereas summing the
    # results of `items()` only works on Python 2.
    variables = dict(tpl_global_vars)
    # The global `now` is computed once, when the module is imported, and goes
    # stale in a long-running process: refresh it for each rendering.
    variables['now'] = datetime.datetime.now()
    if context:
        variables.update(context)
    return tpl_engine.get_template(view).render(variables)


# def render_page(page, title="My Page", context=None):
#     """
#     A simple helper to render the md_page.html template with [context] vars &
#     the additional contents of `page/[page].md` in the `md_page` variable.
#     It automagically adds the global template vars defined above, too.
#     It returns a string, usually the HTML contents to display.
#     """
#     if context is None:
#         context = {}
#     context['title'] = title
#     context['md_page'] = ''
#     with file(get_path('page/%s.md' % page)) as f:
#         context['md_page'] = f.read()
#     return tpl_engine.get_template('md_page.html').render(
#         dict(tpl_global_vars.items() + context.items())
#     )

077980eb   Goutte   Improve availabil...
295

bc18b96c   Goutte   Implement first (...
296
297
298
299
300
301
302
def is_list_in_list(needle, haystack):
    """
    Tell whether every element of [needle] is also an element of [haystack].
    An empty [needle] is always considered to be contained.

    :param needle: iterable of the elements to look for
    :param haystack: container that is searched with the `in` operator
    :return: bool
    """
    return all(item in haystack for item in needle)


1324cc91   Goutte   Make the footer i...
303
304
305
306
307
308
309
310
311
312
313
314
315
def round_time(dt=None, round_to=60):
    """
    Round a datetime object to any time lapse, in seconds.

    :param dt: datetime.datetime object, default now.
    :param round_to: closest number of seconds to round to, default 1 minute.
    :return: the rounded datetime, without any microseconds
    """
    if dt is None:
        dt = datetime.datetime.now()
    # Whole seconds elapsed since the beginning of the day of [dt].
    naive = dt.replace(tzinfo=None)
    elapsed = (naive - dt.min).seconds
    # Closest multiple of [round_to].
    nearest = (elapsed + round_to / 2) // round_to * round_to
    shift = datetime.timedelta(
        seconds=nearest - elapsed,
        microseconds=-dt.microsecond
    )
    return dt + shift


2d2af24b   Goutte   Add a basic orbit...
316
def datetime_from_list(time_list):
    """
    Datetimes in retrieved CDFs are stored as lists of numbers,
    with DayOfYear starting at 0. We want it starting at 1 because it's what
    vendor parsers use, both in python and javascript.

    :param time_list: list of one-character strings: four for the year, three
                      for the zero-based day of year, then the hours, minutes,
                      seconds and fraction of second. The last element of the
                      list is ignored.
    :return: the matching datetime.datetime
    """
    year = ''.join(time_list[0:4])
    # Day Of Year starts at 0, but for our datetime parser it starts at 1
    doy = '{:03d}'.format(int(''.join(time_list[4:7])) + 1)
    clock = ''.join(time_list[7:-1])
    return datetime.datetime.strptime(year + doy + clock, "%Y%j%H%M%S%f")
9390ec89   Goutte   Initial experimen...
328

ce8af118   Goutte   Fix the favicon.
329

927c69c3   Goutte   Make the local ca...
330
331
332
333
334
335
336
337
338
339
340
341
342
343
def get_local_filename(url):
    """
    Build the local cache filename for the distant file.

    The leading `http://` or `https://` is dropped, and what remains is
    slugified. An url without such a prefix is slugified as a whole, instead
    of losing its first characters.

    :param url: string
    :return: string
    """
    from slugify import slugify
    for scheme in ('https://', 'http://'):
        if url.startswith(scheme):
            url = url[len(scheme):]
            break
    return slugify(url)


180d7d97   Goutte   Refactor heavily.
344
def get_target_config(slug):
    """
    Find the configuration of a target from its slug.

    :param slug: value of the `slug` key of the wanted target
    :return: the first matching item of the `targets` list of the config
    :raises Exception: when no configured target bears that slug
    """
    for s in config['targets']:  # dumb
        if s['slug'] == slug:
            return s
    raise Exception("No target found in configuration for '%s'." % slug)
8644387c   Goutte   Use real data.
349
350


180d7d97   Goutte   Refactor heavily.
351
352
353
354
def check_target_config(slug):
    """
    Look up the configuration of the target [slug] and discard it.
    Nothing is returned; whatever `get_target_config` raises propagates.
    """
    get_target_config(slug)


fb383448   Goutte   Implement the cac...
355
356
357
358
359
def get_active_targets():
    """
    List the configured targets that are not locked.

    A target is locked when its configuration holds a truthy `locked` value.

    :return: list of target configurations, in their configured order
    """
    return [
        target for target in config['targets']
        if not target.get('locked')
    ]


11d86851   Goutte   Add support for s...
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
def validate_tap_target_config(target):
    """
    Fetch the configuration of [target] and make sure it can be used with TAP.

    :param target: slug of the target
    :return: the configuration of the target
    :raises Exception: when the target has no `tap` configuration,
                       or when that configuration has no `target_name`
    """
    target_config = get_target_config(target)
    problem = None
    if 'tap' not in target_config:
        problem = "No `tap` configuration for target `%s`."
    elif 'target_name' not in target_config['tap']:
        problem = "No `target_name` in the `tap` configuration for target `%s`."
    if problem is not None:
        raise Exception(problem % target)
    return target_config


# Using pyvo would be best.
# def retrieve_auroral_emissions_vopy(target_name):
#     api_url = "http://voparis-tap.obspm.fr/__system__/tap/run/tap/sync"
#     import pyvo as vo
#     service = vo.dal.TAPService(api_url)
#     # … can't figure out how to install pyvo and spacepy alongside (forking?)


def retrieve_auroral_emissions(target_name, d_started_at=None, d_stopped_at=None):
    """
    Work In Progress.

    Query the `apis.epn_core` table of the TAP service for the images
    (`dataproduct_type='im'`) of a target whose `time_min` lies within the
    requested interval.

    :param target_name: You should probably not let users define this value,
                        as our sanitizing for ADQL may not be 100% safe.
                        Use values from YAML configuration, instead.
                        Below is a list of the ids we found to be existing.
                        > SELECT DISTINCT target_name FROM apis.epn_core
                        - Mars
                        - MERCURY
                        - Jupiter
                        - Titan
                        - Io
                        - VENUS
                        - Ganymede
                        - Uranus
                        - Callisto
                        - Europa
                        - Saturn
    :param d_started_at: datetime of the beginning of the interval.
                         Defaults to 730 days before now.
    :param d_stopped_at: datetime of the end of the interval. Defaults to now.
    :return: a list of dicts with the keys `time_min` and `time_max`
             (datetimes), `thumbnail_url` and `external_link` ;
             or None when the request or its parsing failed (this is logged).
    """

    # Try out the form
    # http://voparis-tap-planeto.obspm.fr/__system__/adql/query/form

    api_url = "http://voparis-tap.obspm.fr/__system__/tap/run/tap/sync"

    if d_started_at is None:
        d_started_at = datetime.datetime.now()
        t_started_at = time.mktime(d_started_at.timetuple()) - 3600 * 24 * 365 * 2
        # t_started_at = 1
    else:
        t_started_at = time.mktime(d_started_at.timetuple())

    if d_stopped_at is None:
        d_stopped_at = datetime.datetime.now()
    t_stopped_at = time.mktime(d_stopped_at.timetuple())

    def timestamp_to_jday(timestamp):
        # 2440587.5 is the julian day of the unix epoch.
        return timestamp / 86400.0 + 2440587.5

    def jday_to_timestamp(jday):
        return (jday - 2440587.5) * 86400.0

    def jday_to_datetime(jday):
        return datetime.datetime.utcfromtimestamp(jday_to_timestamp(jday))

    # SELECT DISTINCT dataproduct_type FROM apis.epn_core
    # > im sp sc

    query = """
SELECT
  time_min,
  time_max,
  thumbnail_url,
  external_link
FROM apis.epn_core
WHERE target_name='{target_name}'
AND   dataproduct_type='im'
AND   time_min >= {jday_start}
AND   time_min <= {jday_stop}
ORDER BY time_min, granule_gid
""".format(
        # In ADQL, like in SQL, a quote inside a string literal is escaped by
        # doubling it. A backslash does not escape anything.
        target_name=target_name.replace("'", "''"),
        jday_start=timestamp_to_jday(t_started_at),
        jday_stop=timestamp_to_jday(t_stopped_at)
    )

#     query = """
# SELECT DISTINCT target_name FROM apis.epn_core
# """

    try:
        # The client-side timeout is a bit longer than the one requested from
        # the server, so that a stalled connection cannot hang us forever.
        response = requests.post(api_url, {
            'REQUEST': 'doQuery',
            'LANG':    'ADQL',
            'QUERY':   query,
            'TIMEOUT': '30',
            'FORMAT':  'VOTable/td'
        }, timeout=60)

        response_xml = response.text

        import xml.etree.ElementTree as ET
        root = ET.fromstring(response_xml)
        namespaces = {'vo': 'http://www.ivoa.net/xml/VOTable/v1.3'}
        rows_xpath = "./vo:RESOURCE/vo:TABLE/vo:DATA/vo:TABLEDATA/vo:TR"
        rows = []
        # The cells of each row come in the order of the SELECT above.
        for row in root.findall(rows_xpath, namespaces):
            rows.append({
                'time_min': jday_to_datetime(float(row[0].text)),
                'time_max': jday_to_datetime(float(row[1].text)),
                'thumbnail_url': row[2].text,
                'external_link': row[3].text,
            })

        # print(rows)
        return rows
    except Exception as e:
        # Best effort: failures are logged, and signaled by returning None.
        log.error("Failed to retrieve auroral emissions : %s", e)
        return None

    # print(query)


180d7d97   Goutte   Refactor heavily.
481
def retrieve_amda_netcdf(orbiter, what, started_at, stopped_at):
    """
    Handles remote querying AMDA's API for URLs, and then downloading,
    extracting and caching the netCDF files.

    :param orbiter: key of the source in the YAML config
                    (in here, it is only used in the log and error messages)
    :param what: either 'model' or 'orbit', a key in the config of the source
                 (it is injected as `dataSet` in the `amda` URL of the config)
    :param started_at: beginning of the interval, sent in ISO format
    :param stopped_at: end of the interval, sent in ISO format
    :return: a list of local file paths to netCDF (.nc) files.
             The request is aborted with a 400 when the list of remote files
             could not be fetched after three attempts.
    """

    url = config['amda'].format(
        dataSet=what,
        startTime=started_at.isoformat(),
        stopTime=stopped_at.isoformat()
    )
    log.info("Fetching remote gzip files list at '%s'." % url)
    retries = 0
    success = False
    errors = []
    remote_gzip_files = []
    while not success and retries < 3:
        try:
            response = urllib.urlopen(url)
            try:
                remote_gzip_files = json.loads(response.read())
            finally:
                response.close()
            if not remote_gzip_files:
                raise Exception("Failed to fetch data at '%s'." % url)
            if remote_gzip_files == 'NODATASET':
                raise Exception("API says there's no dataset at '%s'." % url)
            if remote_gzip_files == 'ERROR':
                raise Exception("API returned an error at '%s'." % url)
            if remote_gzip_files == ['OUTOFTIME']:  # it happens
                return []
                # raise Exception("API says it's out of time at '%s'." % url)
            if not isinstance(remote_gzip_files, list):
                # Any other scalar answer would otherwise be exploded into
                # single characters by the deduplication below.
                raise Exception("Unexpected response at '%s' : %r"
                                % (url, remote_gzip_files))
            success = True
        except Exception as e:
            # `e.message` is deprecated and often empty: format `e` itself.
            log.warning("Failed (%d/3) '%s' : %s" % (retries+1, url, e))
            remote_gzip_files = []
            errors.append(e)
        finally:
            retries += 1
    if not remote_gzip_files:
        log.error("Failed to retrieve data from AMDA.")
        log.error("Failed to fetch gzip files list for %s at '%s' : %s" %
                  (orbiter, url, errors))
        abort(400, "Failed to fetch gzip files list for %s at '%s' : %s" %
                   (orbiter, url, errors))

    remote_gzip_files = list(set(remote_gzip_files))  # remove possible dupes

    log.debug("Fetched remote gzip files list : %s." % str(remote_gzip_files))

    local_gzip_files = []
    for remote_gzip_file in remote_gzip_files:
        # hotfixes to remove when fixed upstream @Myriam
        if remote_gzip_file in ['OUTOFTIME', 'ERROR']:
            continue  # sometimes half the response is okay, the other not
        if remote_gzip_file.endswith('/.gz'):
            continue  # this is just a plain bug
        remote_gzip_file = remote_gzip_file.replace('cdpp1', 'cdpp', 1)
        ################################################
        local_gzip_file = join(CACHE_DIR, get_local_filename(remote_gzip_file))
        local_gzip_files.append(local_gzip_file)
        if not isfile(local_gzip_file):
            log.debug("Retrieving '%s'..." % local_gzip_file)
            urllib.urlretrieve(remote_gzip_file, local_gzip_file)
            log.debug("Retrieved '%s'." % local_gzip_file)
        else:
            log.debug("Found '%s' in the cache." % local_gzip_file)

    local_netc_files = []
    for local_gzip_file in local_gzip_files:
        # Drop the last three characters, which are the gz suffix.
        local_netc_file = local_gzip_file[0:-3]
        log.debug("Unzipping '%s'..." % local_gzip_file)
        try:
            # The whole archive is read before anything is written, so that a
            # corrupted archive never leaves a truncated netCDF file behind.
            with gzip.open(local_gzip_file) as f:
                file_content = f.read()
                with open(local_netc_file, 'w+b') as g:
                    g.write(file_content)
        except Exception as e:
            log.error("Cannot process gz file '%s' from '%s' : %s" %
                      (local_gzip_file, url, e))
            # Sometimes, the downloaded gz is corrupted, and CRC checks fail.
            # We want to delete the local gz file and try again next time.
            if isfile(local_gzip_file):
                removefile(local_gzip_file)
            continue
        local_netc_files.append(local_netc_file)
        log.debug("Unzipped '%s'." % local_gzip_file)

    return list(set(local_netc_files))  # remove possible dupes
8644387c   Goutte   Use real data.
573
574


596da00d   Goutte   Add more exceptio...
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
# class DataParser:
#     """
#     Default data parser
#     A wip to try to handle code exeptions sanely.
#     """
#
#     # Override these using the model configuration
#     default_nc_keys = {
#         'hee': 'HEE',
#         'vtot': 'V',
#         'magn': 'B',
#         'temp': 'T',
#         'dens': 'N',
#         'pdyn': 'P_dyn',
#         'atse': 'Delta_angle',
#     }
#
#     def __init__(self, target, model):
#         self.target = target
#         self.model = model
#         pass
#
#     def _read_var(self, nc, _keys, _key, mandatory=False):
#         try:
#             return nc.variables[_keys[_key]]
#         except KeyError:
#             pass
#         if mandatory:
#             raise Exception("No variable '%s' found in NetCDF." % _keys[_key])
#         return [None] * len(nc.variables['Time'])  # slow -- use numpy?
#
#     def parse(self, cdf_handle):
#         nc_keys = self.default_nc_keys.copy()
#
#         times = cdf_handle.variables['Time']  # YYYY DOY HH MM SS .ms
#         data_v = self._read_var(cdf_handle, nc_keys, 'vtot')
#         data_b = self._read_var(cdf_handle, nc_keys, 'magn')
#         data_t = self._read_var(cdf_handle, nc_keys, 'temp')
#         data_n = self._read_var(cdf_handle, nc_keys, 'dens')
#         data_p = self._read_var(cdf_handle, nc_keys, 'pdyn')
#         data_a = self._read_var(cdf_handle, nc_keys, 'atse')
#
#         return zip()


de97d643   Goutte   Fix more bugs.
620
621
def get_data_for_target(target_config, input_slug,
                        started_at, stopped_at):
    """
    Aggregate the model data (and orbit positions) of a target on an interval.

    Orbit files are read first, so that each model sample can be paired with
    the position stored under the same hour-rounded key.
    Models are then read in configuration order: the very first sample that is
    kept sets the leftmost time, and later samples are only kept when their
    hour is still empty and strictly after that leftmost time.

    :param target_config: configuration dict of the target. This function
                          reads its 'slug', 'name', 'models' and (optional)
                          'orbit' keys.
    :param input_slug: key selecting the list of models to use in
                       target_config['models'].
    :param started_at: datetime, inclusive lower bound of the interval.
    :param stopped_at: datetime, inclusive upper bound of the interval.
    :return: dict whose keys are datetime as str, values tuples of data
    """
    log.debug("Grabbing data for '%s'..." % target_config['slug'])

    try:
        models = target_config['models'][input_slug]
    except Exception as e:
        abort(500, "Invalid model configuration for '%s' : %s"
              % (target_config['slug'], str(e)))
    try:
        orbits = target_config['orbit']['models']
    except KeyError:
        # Orbit configuration is optional: without it no orbit file is read.
        orbits = []
        # abort(500, "Invalid orbit configuration for '%s' : %s"
        #       % (target_config['slug'], str(e)))

    def _sta_sto(_cnf, _sta, _sto):
        """Clamp the interval to the 'started_at'/'stopped_at' of _cnf."""
        if 'started_at' in _cnf:
            _s0 = datetime.datetime.strptime(_cnf['started_at'], FILE_DATE_FMT)
            _s0 = max(_s0, _sta)
        else:
            _s0 = _sta
        if 'stopped_at' in _cnf:
            _s1 = datetime.datetime.strptime(_cnf['stopped_at'], FILE_DATE_FMT)
            _s1 = min(_s1, _sto)
        else:
            _s1 = _sto
        return _s0, _s1

    def _read_var(_nc, _keys, _key, mandatory=False):
        """Get a NetCDF variable, or a list of None when it is optional."""
        try:
            return _nc.variables[_keys[_key]]
        except KeyError:
            pass
        if mandatory:
            raise Exception("No variable '%s' found in NetCDF." % _keys[_key])
        return [None] * len(_nc.variables['Time'])  # slow -- use numpy!

    def _parse_time(_ltime):
        """Convert a 'Time' entry to a datetime, logging it on failure."""
        try:
            return datetime_from_list(_ltime)
        except Exception:
            log.error("Failed to parse time from %s." % _ltime)
            raise

    # Override these using the model configuration in config.yml
    default_nc_keys = {
        'hee': 'HEE',
        'vtot': 'V',
        'magn': 'B',
        'temp': 'T',
        'dens': 'N',
        'pdyn': 'P_dyn',
        'atse': 'Delta_angle',
    }

    precision = "%Y-%m-%dT%H"  # model and orbits times are only equal-ish
    orbit_data = {}  # keys are datetime as str, values arrays of XY

    for orbit in orbits:
        s0, s1 = _sta_sto(orbit, started_at, stopped_at)

        nc_keys = default_nc_keys.copy()
        if 'parameters' in orbit:
            nc_keys.update(orbit['parameters'])

        orbit_files = retrieve_amda_netcdf(
            target_config['slug'], orbit['slug'], s0, s1
        )
        for orbit_file in orbit_files:
            log.debug("%s: opening orbit NETCDF4 '%s'..." %
                      (target_config['name'], orbit_file))
            cdf_handle = Dataset(orbit_file, "r", format="NETCDF4")
            try:  # always release the handle, even when parsing fails
                times = cdf_handle.variables['Time']  # YYYY DOY HH MM SS .ms
                data_hee = _read_var(
                    cdf_handle, nc_keys, 'hee', mandatory=True
                )

                log.debug("%s: aggregating data from '%s'..." %
                          (target_config['name'], orbit_file))
                for ltime, datum_hee in zip(times, data_hee):
                    dtime = _parse_time(ltime)
                    if s0 <= dtime <= s1:
                        dkey = round_time(dtime, 60*60).strftime(precision)
                        orbit_data[dkey] = datum_hee
            finally:
                cdf_handle.close()

    all_data = {}  # keys are datetime as str, values tuples of data
    strip_before_date = None
    for model in models:
        s0, s1 = _sta_sto(model, started_at, stopped_at)
        model_files = retrieve_amda_netcdf(
            target_config['slug'], model['slug'], s0, s1
        )
        nc_keys = default_nc_keys.copy()
        if 'parameters' in model:
            nc_keys.update(model['parameters'])

        if not model_files:
            log.warning("No model data for '%s' '%s'."
                        % (target_config['slug'], model['slug']))

        for model_file in model_files:
            log.debug("%s: opening model NETCDF4 '%s'..." %
                      (target_config['name'], model_file))
            cdf_handle = Dataset(model_file, "r", format="NETCDF4")
            try:  # always release the handle, even when parsing fails
                # log.debug(cdf_handle.variables.keys())

                times = cdf_handle.variables['Time']  # YYYY DOY HH MM SS .ms
                data_v = _read_var(cdf_handle, nc_keys, 'vtot')
                data_b = _read_var(cdf_handle, nc_keys, 'magn')
                data_t = _read_var(cdf_handle, nc_keys, 'temp')
                data_n = _read_var(cdf_handle, nc_keys, 'dens')
                data_p = _read_var(cdf_handle, nc_keys, 'pdyn')
                data_a = _read_var(cdf_handle, nc_keys, 'atse')

                # Usually:
                # Time, StartTime, StopTime, V, B, N, T, Delta_angle, P_dyn
                # Earth:
                # Time, BartelsNumber, ImfID, SwID, ImfPoints,
                # SwPoints, B_M_av, B_Vec_av, B_Theta_av,
                # B_Phi_av, B, T, N, V, Vlat, Vlon,
                # Alpha, RamP, E, Beta, Ma, Kp, R, DST,
                # AE, Flux, Flag, F10_Index, StartTime, StopTime

                log.debug("%s: aggregating data from '%s'..." %
                          (target_config['name'], model_file))
                for ltime, datum_v, datum_b, datum_t, datum_n, datum_p, \
                        datum_a in zip(times, data_v, data_b, data_t,
                                       data_n, data_p, data_a):

                    dtime = _parse_time(ltime)
                    if not (s0 <= dtime <= s1):
                        continue

                    droundtime = round_time(dtime, 60*60)
                    dkey = droundtime.strftime(precision)

                    x_hee = None
                    y_hee = None
                    if dkey in orbit_data:
                        x_hee = orbit_data[dkey][0] / ASTRONOMICAL_UNIT_IN_KM
                        y_hee = orbit_data[dkey][1] / ASTRONOMICAL_UNIT_IN_KM

                    # First exception: V may be a vector instead of a scalar
                    if hasattr(datum_v, '__len__'):
                        vrad = datum_v[0]
                        vtan = datum_v[1]
                        vtot = sqrt(vrad * vrad + vtan * vtan)
                    else:  # eg: Earth
                        vrad = None
                        vtan = None
                        vtot = datum_v

                    if target_config['slug'] == 'earth':
                        # Second exception: Earth is always at (1, 0)
                        x_hee = 1
                        y_hee = 0

                        # Skip samples without a usable speed *before*
                        # deriving anything from it: multiplying by a
                        # missing (None) speed would raise a TypeError.
                        if vtot is None or isnan(vtot):
                            continue

                        # Third exception: B is a Vector3 or a Vector2
                        # for Earth
                        if model['slug'] == 'omni_hour_all':  # Vector3
                            datum_b = datum_b[0]
                        # if model['slug'] == 'ace_swepam_real':  # Vector2
                        #     datum_b = datum_b[0]

                        # For these models the pressure is recomputed from
                        # density and speed.
                        # NOTE(review): 1.6726e-6 looks like a scaled proton
                        # mass -- confirm the units.
                        if model['slug'] in ('omni_hour_all',
                                             'ace_swepam_real'):
                            datum_p = datum_n * vtot * vtot * 1.6726e-6

                    # Keep adding exceptions here until you can't or
                    # become mad

                    first = False
                    if strip_before_date is None:
                        first = True
                        strip_before_date = droundtime

                    # First model has priority, and also sets a leftmost time
                    if first or (
                        (dkey not in all_data) and
                        (droundtime > strip_before_date)
                    ):
                        # /!\ MUST be in the same order as PROPERTIES
                        all_data[dkey] = (
                            dtime.strftime("%Y-%m-%dT%H:%M:%S+00:00"),
                            vrad, vtan, vtot,
                            datum_b, datum_t, datum_p, datum_n, datum_a,
                            x_hee, y_hee
                        )
            finally:
                cdf_handle.close()

    return all_data


297a7dfc   Goutte   Add support for i...
817
def generate_csv_contents(target_slug, input_slug, started_at, stopped_at):
    """
    Build the CSV text holding the data of a target on an interval.

    The first row is PROPERTIES (the header), followed by one row per entry
    returned by get_data_for_target(), written in the sorted order of keys.

    :param target_slug: slug used to fetch the target configuration.
    :param input_slug: passed as-is to get_data_for_target().
    :param started_at: passed as-is to get_data_for_target().
    :param stopped_at: passed as-is to get_data_for_target().
    :return: the whole CSV, as a string.
    """
    target_config = get_target_config(target_slug)
    log.debug("Crunching CSV contents for '%s'..." % target_config['name'])

    csv_buffer = StringIO.StringIO()
    rows_writer = csv_writer(csv_buffer)
    rows_writer.writerow(PROPERTIES)

    rows_by_key = get_data_for_target(
        target_config=target_config, input_slug=input_slug,
        started_at=started_at, stopped_at=stopped_at
    )

    log.debug("Writing and sorting CSV for '%s'..." % target_config['slug'])
    rows_writer.writerows(rows_by_key[key] for key in sorted(rows_by_key))

    log.info("Generated CSV contents for '%s'." % target_config['slug'])
    return csv_buffer.getvalue()

8644387c   Goutte   Use real data.
836

de97d643   Goutte   Fix more bugs.
837
838
def generate_csv_file_if_needed(target_slug, input_slug,
                                started_at, stopped_at):
    """
    Make sure a non-empty CSV file is cached for the given request.

    The file lives in CACHE_DIR and is named after the target, the input and
    the interval. Nothing is done when it already holds more than one line.
    Otherwise it is (re)generated; on failure the error and its traceback are
    logged, the partial file is removed and the request is aborted (500).

    :param target_slug: slug of the target.
    :param input_slug: slug of the input.
    :param started_at: datetime, formatted in the filename with FILE_DATE_FMT.
    :param stopped_at: datetime, formatted in the filename with FILE_DATE_FMT.
    """
    filename = "%s_%s_%s_%s.csv" % (
        target_slug,
        input_slug,
        started_at.strftime(FILE_DATE_FMT),
        stopped_at.strftime(FILE_DATE_FMT),
    )
    local_csv_file = join(CACHE_DIR, filename)

    if isfile(local_csv_file):
        # It needs to have more than one line to not be empty (headers)
        with open(local_csv_file) as cached_file:
            for line_number, _ in enumerate(cached_file, 1):
                if line_number > 1:
                    return  # already generated, nothing to do

    log.info("Generating CSV '%s'..." % local_csv_file)
    try:
        with open(local_csv_file, mode="w+") as csv_file:
            csv_file.write(generate_csv_contents(
                target_slug=target_slug, input_slug=input_slug,
                started_at=started_at, stopped_at=stopped_at
            ))
        log.info("Generation of '%s' done." % filename)
    except Exception as e:
        from sys import exc_info
        from traceback import extract_tb
        failure_traceback = exc_info()[2]
        log.error(e)
        for trace in extract_tb(failure_traceback):
            log.error(trace)
        # Never leave a half-written file in the cache.
        if isfile(local_csv_file):
            log.warn("Removing failed CSV '%s'..." % local_csv_file)
            removefile(local_csv_file)
        abort(500, "Failed creating CSV '%s' : %s" % (filename, e))
c0df94bc   Goutte   Adding more logs.
875
876


e18701b6   Goutte   Cache clear (remo...
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
def remove_all_files(in_directory):
    """
    Remove every regular file directly inside a directory.

    Will throw if something horrible happens.
    Does not remove recursively (could be done with os.walk if needed).
    Does not remove directories either.
    :param in_directory: absolute path to directory
    :return: list of the paths of the files that were removed
    :raises ValueError: when in_directory is not an existing directory
    """
    import os

    if not os.path.isdir(in_directory):
        # The path must be interpolated, or the message shows a raw '%s'.
        raise ValueError("No directory to clean at '%s'." % in_directory)

    removed_files = []
    for file_name in os.listdir(in_directory):
        file_path = os.path.join(in_directory, file_name)
        if os.path.isfile(file_path):
            os.remove(file_path)
            removed_files.append(file_path)

    return removed_files


28bb4b28   Goutte   API for the cache...
900
901
def remove_files_created_before(date, in_directory):
    """
    Remove the regular files of a directory whose st_ctime is before a date.

    Will throw if something horrible happens.
    Does not remove recursively (could be done with os.walk if needed).
    Does not remove directories either.
    :param date: datetime object, converted to a timestamp using local time
    :param in_directory: absolute path to directory
    :return: list of the paths of the files that were removed
    :raises ValueError: when in_directory is not an existing directory
    """
    import os
    import time

    secs = time.mktime(date.timetuple())

    if not os.path.isdir(in_directory):
        # The path must be interpolated, or the message shows a raw '%s'.
        raise ValueError("No directory to clean at '%s'." % in_directory)

    removed_files = []
    for file_name in os.listdir(in_directory):
        file_path = os.path.join(in_directory, file_name)
        if os.path.isfile(file_path):
            # NOTE: st_ctime is the creation time on Windows only; on Unix
            # it is the time of the last metadata change.
            if os.stat(file_path).st_ctime < secs:
                os.remove(file_path)
                removed_files.append(file_path)

    return removed_files


297a7dfc   Goutte   Add support for i...
929
930
931
932
933
def get_input_slug_from_query(inp=None):
    """
    Get a valid input slug, from `inp` or from the request's query string.

    :param inp: candidate input slug. When None, the 'input_slug' argument of
                the current request is used instead (defaulting to 'l1').
    :return: the candidate when it is the slug of one of config['inputs'],
             and 'l1' otherwise.
    """
    fallback_slug = 'l1'
    if inp is not None:
        candidate = inp
    else:
        candidate = request.args.get('input_slug', fallback_slug)

    known_slugs = [i['slug'] for i in config['inputs']]
    if candidate in known_slugs:
        return candidate
    return fallback_slug  # be tolerant instead of yelling loudly


284f4688   Goutte   Continue layers i...
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
def get_interval_from_query():
    """
    Get the interval from the query, or from defaults.

    The defaults span from two months before today to one month after today,
    formatted with FILE_DATE_FMT.

    :return: tuple (started_at, stopped_at) of strings, not datetimes.
    """
    today = datetime.datetime.now().replace(hour=0, minute=0, second=0)
    default_started_at = (today - relativedelta(months=2)).strftime(
        FILE_DATE_FMT
    )
    default_stopped_at = (today + relativedelta(months=1)).strftime(
        FILE_DATE_FMT
    )

    return (
        request.args.get('started_at', default_started_at),
        request.args.get('stopped_at', default_stopped_at),
    )


1185f353   Goutte   Fix the CME Catal...
957
def get_catalog_layers(input_slug, target_slug, started_at, stopped_at):
    """
    Collect the events of each catalog layer for an input and a target.

    In the JSON file we have "columns" and "data".
    Of course, each JSON file has its own columns, with different conventions.

    An event is kept when it validates at least one of the configured
    constraints (or when there are none), and when it does not start before
    `started_at`.

    :param input_slug: slug of the input, looked up in each catalog datum.
    :param target_slug: slug of the target, looked up under the input.
    :param started_at: string formatted like FILE_DATE_FMT.
    :param stopped_at: string formatted like FILE_DATE_FMT.
    :return: dict whose keys are the slugs of the catalog layers having
             'data', and whose values are lists of dicts with the keys
             'start' and 'stop', formatted with MOMENT_DATE_FMT.
    """

    def _get_index_of_key(_data, _key):
        """Find the position of the column _key, logging when missing."""
        try:
            index = _data['columns'].index(_key)
        except ValueError:
            log.error("Key %s not found in columns of %s" % (_key, _data))
            raise
        return index

    def _validates_any_constraint(_data, _row, _constraints):
        """True without constraints, or when _row fully matches one."""
        if not _constraints:
            return True
        return any(
            all(
                _row[_get_index_of_key(_data, _key)] in _possible_values
                for _key, _possible_values in _constraint.items()
            )
            for _constraint in _constraints
        )

    # Only catch parsing failures: a bare except would also swallow
    # things like KeyboardInterrupt and report them as a bad request.
    try:
        started_at = datetime.datetime.strptime(started_at, FILE_DATE_FMT)
    except (TypeError, ValueError):
        abort(400, "Invalid started_at parameter : '%s'." % started_at)
    try:
        # NOTE(review): stopped_at is validated but not used to filter the
        # events below -- confirm this is intended.
        stopped_at = datetime.datetime.strptime(stopped_at, FILE_DATE_FMT)
    except (TypeError, ValueError):
        abort(400, "Invalid stopped_at parameter : '%s'." % stopped_at)

    catalog_layers = {}
    for config_layer in config['layers']['catalogs']:
        if 'data' not in config_layer:
            continue
        layer_events = []
        catalog_layers[config_layer['slug']] = layer_events
        for cl_datum in config_layer['data']:
            if input_slug not in cl_datum:
                continue
            if target_slug not in cl_datum[input_slug]:
                continue
            target_rules = cl_datum[input_slug][target_slug]
            if target_rules is None:
                # We used ~ in the config, there are no constraints
                constraints = []
            else:
                constraints = target_rules['constraints']

            # Validate the configuration before reading the catalog file.
            if 'start' not in cl_datum:
                log.error("Invalid configuration: 'start' is missing.")
                continue  # skip this
            # The default format is stored back in the configuration, like
            # the previous implementation did.
            # log.error("Invalid configuration: 'format' is missing.")
            # continue  # skip this
            cl_datum.setdefault('format', CME_DATE_FMT)
            date_format = cl_datum['format']

            # The file is only needed for loading; close it right after.
            with open(get_path("../data/catalog/%s" % cl_datum['file'])) as f:
                json_data = json.load(f)

            start_index = _get_index_of_key(json_data, cl_datum['start'])
            if 'stop' not in cl_datum:
                stop_index = start_index
            else:
                stop_index = _get_index_of_key(json_data, cl_datum['stop'])

            for json_datum in json_data['data']:
                if not _validates_any_constraint(
                        json_data, json_datum, constraints):
                    continue

                start_time = datetime.datetime.strptime(
                    json_datum[start_index], date_format
                )
                stop_time = datetime.datetime.strptime(
                    json_datum[stop_index], date_format
                )

                if start_time < started_at:
                    continue

                layer_events.append({
                    'start': start_time.strftime(MOMENT_DATE_FMT),
                    'stop':  stop_time.strftime(MOMENT_DATE_FMT),
                })

    return catalog_layers


077980eb   Goutte   Improve availabil...
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
def get_hit_counter():
    """
    Read the number of visits stored in the VISITS file.

    :return: the content of the file as an int, or 1 when there is no file.
    """
    hit_count_path = get_path("../VISITS")

    if not isfile(hit_count_path):
        return 1

    # Use a context manager so the file handle is always closed.
    with open(hit_count_path) as hit_counter_file:
        return int(hit_counter_file.read())


a4a9ef03   Goutte   Cache generated C...
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
def increment_hit_counter():
    """
    Add one to the number of visits stored in the VISITS file.

    The file is created, holding 1, when it does not exist yet.

    :return: the new number of visits, as an int.
    """
    hit_count_path = get_path("../VISITS")

    # Context managers make sure both handles are closed, even on failure.
    if isfile(hit_count_path):
        with open(hit_count_path) as hit_counter_file:
            hit_count = int(hit_counter_file.read()) + 1
    else:
        hit_count = 1

    with open(hit_count_path, 'w') as hit_counter_file:
        hit_counter_file.write(str(hit_count))

    return hit_count


4aaf6874   Goutte   Try fixing the ge...
1082
1083
def update_spacepy():
    """
    Importing pycdf will fail if the toolbox is not up to date.

    This is best-effort: any failure (including spacepy being unavailable)
    is logged as an error and not raised.
    """
    try:
        log.info("Updating spacepy's toolbox…")
        from spacepy import toolbox as spacepy_toolbox

        spacepy_toolbox.update()
    except Exception as failure:
        log.error("Failed to update spacepy : %s." % failure)


077980eb   Goutte   Improve availabil...
1095
1096
1097
# Read the visit counter once, when this module is loaded, and store it under
# the 'visits' key of tpl_global_vars (presumably the variables shared by all
# the templates -- its definition is not in this part of the file).
tpl_global_vars['visits'] = get_hit_counter()


a4a9ef03   Goutte   Cache generated C...
1098
1099
1100
# ROUTING #####################################################################

@app.route('/favicon.ico')
def favicon():  # we want it served from the root, not from static/
    """Serve the favicon stored in the static/img directory of the app."""
    icons_directory = join(app.root_path, 'static', 'img')
    return send_from_directory(
        icons_directory, 'favicon.ico',
        mimetype='image/vnd.microsoft.icon'
    )


@app.route("/")
@app.route("/home.html")
@app.route("/index.html")
def home():
    """
    Render the home page.

    Counts the visit, then gathers the parameters (sorted by 'position'),
    the unlocked targets along with their catalog layers for the requested
    input and interval, and the targets grouped by type.
    """
    increment_hit_counter()
    # sorted() works on both a list and a dict view, unlike an in-place sort.
    parameters = sorted(PARAMETERS.values(), key=lambda x: x['position'])
    input_slug = get_input_slug_from_query()
    targets = [t for t in config['targets'] if not t['locked']]
    started_at, stopped_at = get_interval_from_query()
    # The targets are the very dicts held by the configuration, so the
    # layers are attached to the configuration itself.
    for target in targets:
        target['catalog_layers'] = get_catalog_layers(
            input_slug, target['slug'], started_at, stopped_at
        )
    return render_view('home.html.jinja2', {
        # 'targets': config['targets'],
        'targets': targets,
        'parameters': parameters,
        'input_slug': input_slug,
        'started_at': started_at,
        'stopped_at': stopped_at,
        'planets': [s for s in config['targets'] if s['type'] == 'planet'],
        'probes':  [s for s in config['targets'] if s['type'] == 'probe'],
        'comets':  [s for s in config['targets'] if s['type'] == 'comet'],
        'visits':  get_hit_counter(),
    })


64a671cd   Goutte   Add an About page.
1136
1137
@app.route("/about.html")
def about():
    """
    Render the about page, and count the visit.

    The template receives the mails of the authors, the first three
    characters of a random UUID4, and the number of visits.
    """
    import uuid

    increment_hit_counter()

    authors_emails = [author['mail'] for author in config['authors']]
    short_uuid = str(uuid.uuid4())[:3]
    template_vars = {
        'authors_emails': authors_emails,
        'uuid4': short_uuid,
        'visits': get_hit_counter(),
    }
    return render_view('about.html.jinja2', template_vars)


6288347a   Goutte   Add the HELP page...
1147
1148
1149
1150
1151
1152
1153
@app.route("/help.html")
def help():
    """Render the help page, along with the current number of visits."""
    template_vars = {'visits': get_hit_counter()}
    return render_view('help.html.jinja2', template_vars)


297a7dfc   Goutte   Add support for i...
1154
1155
@app.route("/<target>_<inp>_<started_at>_<stopped_at>.csv")
def download_target_csv(target, inp, started_at, stopped_at):
    """
    Grab data and orbit data for the specified `target`,
    rearrange it and return it as a CSV file.
    `started_at` and `stopped_at` should be UTC.
    `inp` is the input slug, l1 or sa or sb.

    The CSV is generated in CACHE_DIR when needed, and served from there.
    Aborts with 400 when a date cannot be parsed with FILE_DATE_FMT, and
    with 500 when the cached file is still missing after generation.
    """
    check_target_config(target)
    # Only catch parsing failures: a bare except would also swallow
    # things like KeyboardInterrupt and report them as a bad request.
    try:
        started_at = datetime.datetime.strptime(started_at, FILE_DATE_FMT)
    except (TypeError, ValueError):
        abort(400, "Invalid started_at parameter : '%s'." % started_at)
    try:
        stopped_at = datetime.datetime.strptime(stopped_at, FILE_DATE_FMT)
    except (TypeError, ValueError):
        abort(400, "Invalid stopped_at parameter : '%s'." % stopped_at)
    input_slug = get_input_slug_from_query(inp=inp)

    # Must match the name used by generate_csv_file_if_needed().
    filename = "%s_%s_%s_%s.csv" % (target, input_slug,
                                    started_at.strftime(FILE_DATE_FMT),
                                    stopped_at.strftime(FILE_DATE_FMT))
    local_csv_file = join(CACHE_DIR, filename)
    generate_csv_file_if_needed(
        target_slug=target, input_slug=input_slug,
        started_at=started_at, stopped_at=stopped_at
    )
    if not isfile(local_csv_file):
        abort(500, "Could not cache CSV file at '%s'." % local_csv_file)

    return send_from_directory(CACHE_DIR, filename)
a4a9ef03   Goutte   Cache generated C...
1185
1186


297a7dfc   Goutte   Add support for i...
1187
1188
@app.route("/<targets>_<inp>_<started_at>_<stopped_at>.tar.gz")
def download_targets_tarball(targets, inp, started_at, stopped_at):
    """
    Grab data and orbit data for each of the specified `targets`,
    in their own CSV file, and make a tarball of them.
    `started_at` and `stopped_at` should be UTC strings.

    Note: we do not use this route anymore, but let's keep it shelved for now.

    targets: string list of targets' slugs, separated by `-`.
    inp: input slug, resolved through `get_input_slug_from_query`.
    started_at: start of the interval, formatted as `FILE_DATE_FMT`.
    stopped_at: end of the interval, formatted as `FILE_DATE_FMT`.

    The CSV files and the tarball are written in `CACHE_DIR` and reused
    when they already exist there.
    Aborts with a 400 on invalid targets or dates, and with a 500 when there
    is no tarball to serve in the end.
    """
    separator = '-'
    targets = targets.split(separator)
    targets.sort()
    targets_configs = []
    for target in targets:
        if not target:
            abort(400, "Invalid targets format : `%s`." % targets)
        targets_configs.append(get_target_config(target))
    if not targets_configs:
        abort(400, "No valid targets specified. What are you doing?")

    # Only catch what strptime raises on bad input, not everything.
    try:
        started_at = datetime.datetime.strptime(started_at, FILE_DATE_FMT)
    except (ValueError, TypeError):
        abort(400, "Invalid started_at parameter : '%s'." % started_at)
    try:
        stopped_at = datetime.datetime.strptime(stopped_at, FILE_DATE_FMT)
    except (ValueError, TypeError):
        abort(400, "Invalid stopped_at parameter : '%s'." % stopped_at)
    sta = started_at.strftime(FILE_DATE_FMT)
    sto = stopped_at.strftime(FILE_DATE_FMT)

    input_slug = get_input_slug_from_query(inp=inp)

    gzip_filename = "%s_%s_%s_%s.tar.gz" % (
        separator.join(targets), input_slug, sta, sto
    )
    local_gzip_file = join(CACHE_DIR, gzip_filename)

    if not isfile(local_gzip_file):
        # One CSV per target, in the same order as `targets_configs`.
        csv_filenames = [
            "%s_%s_%s_%s.csv" % (target_config['slug'], input_slug, sta, sto)
            for target_config in targets_configs
        ]

        log.debug("Creating the CSV files for the tarball...")
        for target_config, filename in zip(targets_configs, csv_filenames):
            local_csv_file = join(CACHE_DIR, filename)
            if not isfile(local_csv_file):
                # Generate the contents BEFORE opening the file, so that a
                # failure does not leave an empty CSV file in the cache.
                contents = generate_csv_contents(
                    target_slug=target_config['slug'],
                    started_at=started_at,
                    stopped_at=stopped_at,
                    input_slug=input_slug
                )
                with open(local_csv_file, mode="w+") as f:
                    f.write(contents)

        log.debug("Creating the tarball '%s'..." % local_gzip_file)
        try:
            with tarfile.open(local_gzip_file, "w:gz") as tar:
                for filename in csv_filenames:
                    tar.add(join(CACHE_DIR, filename), arcname=filename)
        except Exception:
            # Never keep a partial tarball around, it would be served as-is
            # by the next request since it would look like a cache hit.
            log.error("Failed to generate tarball '%s'." % local_gzip_file)
            if isfile(local_gzip_file):
                removefile(local_gzip_file)
            raise

    if not isfile(local_gzip_file):
        abort(500, "No tarball to serve. Looked at '%s'." % local_gzip_file)

    return send_from_directory(CACHE_DIR, gzip_filename)
b2837a08   Goutte   Add three retries...
1256

28bb4b28   Goutte   API for the cache...
1257

297a7dfc   Goutte   Add support for i...
1258
1259
@app.route("/<targets>_<inp>_<params>_<started_at>_<stopped_at>.nc")
def download_targets_netcdf(targets, inp, params, started_at, stopped_at):
    """
    NOTE : This is not used anymore.

    Grab data and orbit data for each of the specified `targets`,
    rearrange it and return it as a NetCDF file.
    `started_at` and `stopped_at` are expected to be UTC.

    targets: string list of targets' slugs, separated by `-`.
    inp: input slug, resolved through `get_input_slug_from_query`.
    params: string list of targets' parameters, separated by `-`.
    started_at: start of the interval, formatted as `FILE_DATE_FMT`.
    stopped_at: end of the interval, formatted as `FILE_DATE_FMT`.

    The NetCDF file is written in `CACHE_DIR` and reused when it already
    exists there. Each target gets its own group, holding a `time` variable,
    one variable per selected parameter, and the `xhee` and `yhee` orbit.
    Aborts with a 400 on invalid targets, parameters or dates, and with a 500
    when there is no file to serve in the end.
    """
    separator = '-'  # /!\ this char should never be in target's slugs
    targets = targets.split(separator)
    targets.sort()
    targets_configs = []
    for target in targets:
        if not target:
            abort(400, "Invalid targets format : `%s`." % targets)
        targets_configs.append(get_target_config(target))
    if not targets_configs:
        abort(400, "No valid targets specified. What are you doing?")

    params = params.split(separator)
    params.sort()
    if not params:
        abort(400, "No valid parameters specified. What are you doing?")
    if not is_list_in_list(params, PARAMETERS.keys()):
        abort(400, "Some parameters are not recognized in '%s'." % str(params))

    date_fmt = FILE_DATE_FMT
    # Only catch what strptime raises on bad input, not everything.
    try:
        started_at = datetime.datetime.strptime(started_at, date_fmt)
    except (ValueError, TypeError):
        abort(400, "Invalid started_at parameter : '%s'." % started_at)
    try:
        stopped_at = datetime.datetime.strptime(stopped_at, date_fmt)
    except (ValueError, TypeError):
        abort(400, "Invalid stopped_at parameter : '%s'." % stopped_at)
    sta = started_at.strftime(date_fmt)
    sto = stopped_at.strftime(date_fmt)

    input_slug = get_input_slug_from_query(inp=inp)

    nc_filename = "%s_%s_%s_%s_%s.nc" % (
        separator.join(targets), separator.join(params), input_slug, sta, sto
    )
    nc_path = join(CACHE_DIR, nc_filename)

    if not isfile(nc_path):
        log.debug("Creating the NetCDF file '%s'..." % nc_filename)
        try:
            nc_handle = Dataset(nc_path, "w", format="NETCDF4")
            try:
                nc_handle.description = "Model and orbit data for targets"  # todo
                nc_handle.history = "Created " + time.ctime(time.time())
                nc_handle.source = "Heliopropa (CDDP)"

                available_params = list(PROPERTIES)
                index_x = available_params.index('xhee')
                index_y = available_params.index('yhee')
                for target in targets_configs:
                    target_slug = target['slug']
                    log.debug("Adding group '%s' to the NetCDF..." % target_slug)
                    nc_group = nc_handle.createGroup(target_slug)
                    data = get_data_for_target(
                        target_config=target, input_slug=input_slug,
                        started_at=started_at, stopped_at=stopped_at
                    )
                    dkeys = sorted(data)
                    dimension = 'dim_'+target_slug
                    nc_handle.createDimension(dimension, len(dkeys))

                    # TIME #
                    nc_time = nc_group.createVariable('time', 'i8', (dimension,))
                    nc_time.units = "hours since 1970-01-01 00:00:00"
                    nc_time.calendar = "standard"
                    times = []
                    for dkey in dkeys:
                        time_as_string = data[dkey][0][:-6]  # remove +00:00 tail
                        date = datetime.datetime.strptime(time_as_string, date_fmt)
                        times.append(date2num(
                            date, units=nc_time.units, calendar=nc_time.calendar
                        ))
                    nc_time[:] = times

                    # SELECTED PARAMETERS #
                    for param in params:
                        index = available_params.index(param)
                        nc_var = nc_group.createVariable(param, 'f8', (dimension,))
                        nc_var.units = PARAMETERS[param]['units']
                        nc_var[:] = [data[dkey][index] for dkey in dkeys]

                    # ORBIT #
                    nc_x = nc_group.createVariable('xhee', 'f8', (dimension,))
                    nc_x.units = 'Au'
                    nc_y = nc_group.createVariable('yhee', 'f8', (dimension,))
                    nc_y.units = 'Au'
                    nc_x[:] = [data[dkey][index_x] for dkey in dkeys]
                    nc_y[:] = [data[dkey][index_y] for dkey in dkeys]
                log.debug("Writing NetCDF '%s'..." % nc_filename)
            finally:
                # Always release the handle, even when the generation failed.
                nc_handle.close()
        except Exception:
            log.error("Failed to generate NetCDF '%s'." % nc_filename)
            # Never keep a partial file around, it would be served as-is
            # by the next request since it would look like a cache hit.
            if isfile(nc_path):
                removefile(nc_path)
            raise

    if not isfile(nc_path):
        abort(500, "No NetCDF to serve. Looked at '%s'." % nc_path)

    return send_from_directory(CACHE_DIR, nc_filename)
bc18b96c   Goutte   Implement first (...
1383
1384


297a7dfc   Goutte   Add support for i...
1385
1386
@app.route("/<targets>_<inp>_<started_at>_<stopped_at>.cdf")
def download_targets_cdf(targets, inp, started_at, stopped_at):
    """
    Grab data and orbit data for each of the specified `targets`,
    rearrange it and return it as a CDF file.
    `started_at` and `stopped_at` are expected to be UTC.

    targets: string list of targets' slugs, separated by `-`.
    inp: input slug, resolved through `get_input_slug_from_query`.
    started_at: start of the interval, formatted as `FILE_DATE_FMT`.
    stopped_at: end of the interval, formatted as `FILE_DATE_FMT`.

    All the parameters of `PARAMETERS` are written, there is no selection.
    The CDF file is written in `CACHE_DIR` and reused when it already exists
    there. Variables are named `<target slug>_<parameter>`.
    Aborts with a 400 on invalid targets or dates, and with a 500 when there
    is no file to serve in the end.
    """
    separator = '-'  # /!\ this char should never be in target's slugs
    targets = targets.split(separator)
    targets.sort()
    targets_configs = []
    for target in targets:
        if not target:
            abort(400, "Invalid targets format : `%s`." % targets)
        targets_configs.append(get_target_config(target))
    if not targets_configs:
        abort(400, "No valid targets specified. What are you doing?")

    params = PARAMETERS.keys()

    # Only catch what strptime raises on bad input, not everything.
    try:
        started_at = datetime.datetime.strptime(started_at, FILE_DATE_FMT)
    except (ValueError, TypeError):
        abort(400, "Invalid started_at parameter : '%s'." % started_at)
    try:
        stopped_at = datetime.datetime.strptime(stopped_at, FILE_DATE_FMT)
    except (ValueError, TypeError):
        abort(400, "Invalid stopped_at parameter : '%s'." % stopped_at)
    sta = started_at.strftime(FILE_DATE_FMT)
    sto = stopped_at.strftime(FILE_DATE_FMT)

    input_slug = get_input_slug_from_query(inp=inp)

    cdf_filename = "%s_%s_%s_%s.cdf" % (
        separator.join(targets), input_slug, sta, sto
    )
    cdf_path = join(CACHE_DIR, cdf_filename)

    if not isfile(cdf_path):
        log.debug("Creating the CDF file '%s'..." % cdf_filename)
        try:
            from spacepy import pycdf
        except ImportError:
            # If spacepy's toolbox is not up-to-date, importing will fail.
            # So, let's update and try again !
            update_spacepy()
            try:
                from spacepy import pycdf
            except ImportError as e:
                log.error("Failed to import pycdf from spacepy : %s" % e)
                raise
        except Exception as e:
            log.error("Failed to import pycdf from spacepy : %s" % e)
            raise

        try:
            cdf_handle = pycdf.CDF(cdf_path, masterpath='')
            try:
                targets_names = ', '.join([t['name'] for t in targets_configs])
                description = "Model and orbit data for %s." % targets_names
                cdf_handle.attrs['Description'] = description
                cdf_handle.attrs['Author'] = "Heliopropa.irap.omp.eu (CDPP)"
                cdf_handle.attrs['Created'] = str(time.ctime(time.time()))

                # fixme: Try changing the name from 00 to something relevant
                cdf_handle.attrs['Title'] = "Heliopropa - %s" % targets_names

                available_params = list(PROPERTIES)
                index_x = available_params.index('xhee')
                index_y = available_params.index('yhee')
                for target in targets_configs:
                    target_slug = target['slug']
                    data = get_data_for_target(
                        target_config=target, input_slug=input_slug,
                        started_at=started_at, stopped_at=stopped_at
                    )
                    dkeys = sorted(data)

                    # TIME #
                    values = []
                    for dkey in dkeys:
                        time_str = data[dkey][0][:-6]  # remove +00:00 tail
                        date = datetime.datetime.strptime(
                            time_str, FILE_DATE_FMT
                        )
                        values.append(date)
                    kt = "%s_time" % target_slug
                    cdf_handle.new(kt, type=pycdf.const.CDF_EPOCH)
                    cdf_handle[kt] = values
                    # cdf_handle[kt].attrs['FIELDNAM'] = "Time since 0 A.D"

                    # PARAMETERS #
                    for param in params:
                        k = "%s_%s" % (target_slug, param)
                        i = available_params.index(param)
                        values = [data[dkey][i] for dkey in dkeys]
                        if any(value is None for value in values):
                            # PyCDF hates it when there are Nones.
                            # Since we don't know what value to set instead,
                            # let's skip the param altogether.
                            continue
                        cdf_handle[k] = values
                        attrs = cdf_handle[k].attrs
                        attrs['UNITS'] = PARAMETERS[param]['units']
                        attrs['LABLAXIS'] = PARAMETERS[param]['name']
                        attrs['FIELDNAM'] = PARAMETERS[param]['title']
                        if values:
                            attrs['VALIDMIN'] = min(values)
                            attrs['VALIDMAX'] = max(values)

                    # ORBIT #
                    kx = "%s_xhee" % target_slug
                    ky = "%s_yhee" % target_slug
                    values_xhee = []
                    values_yhee = []
                    for dkey in dkeys:
                        value_xhee = data[dkey][index_x]
                        value_yhee = data[dkey][index_y]
                        # We've got some `None`s cropping up in the data
                        # sometimes. PyCDF does not digest Nones at all.
                        # While they solve this upstream, let's make an
                        # ugly fix!
                        if (value_xhee is not None) and (value_yhee is not None):
                            values_xhee.append(value_xhee)
                            values_yhee.append(value_yhee)
                        else:
                            values_xhee.append(0)
                            values_yhee.append(0)
                            log.warn("Orbit data for %s has NaNs." % target_slug)
                    cdf_handle[kx] = values_xhee
                    cdf_handle[ky] = values_yhee
                    cdf_handle[kx].attrs['UNITS'] = 'Au'
                    cdf_handle[ky].attrs['UNITS'] = 'Au'

                log.debug("Writing CDF '%s'..." % cdf_filename)
            finally:
                # Always release the handle, even when the generation failed,
                # so that we do not leak it nor remove a file that is still
                # opened below.
                cdf_handle.close()
            log.debug("Wrote CDF '%s'." % cdf_filename)

        except Exception:
            log.error("Failed to generate CDF '%s'." % cdf_filename)
            # Never keep a partial file around, it would be served as-is
            # by the next request since it would look like a cache hit.
            if isfile(cdf_path):
                removefile(cdf_path)
            raise

    if not isfile(cdf_path):
        abort(500, "No CDF to serve. Looked at '%s'." % cdf_path)

    return send_from_directory(CACHE_DIR, cdf_filename)


11d86851   Goutte   Add support for s...
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
1560
1561
1562
1563
1564
1565
1566
1567
1568
1569
1570
1571
1572
1573
1574
1575
1576
1577
1578
1579
1580
1581
1582
1583
1584
1585
1586
1587
1588
1589
1590
1591
1592
1593
@app.route("/<target>_auroral_catalog.csv")
def download_auroral_catalog_csv(target):
    """
    Retrieve the auroral emissions of the specified `target`,
    keep those whose thumbnail URL looks like a processed image,
    and return them as CSV contents.

    target: slug of the target, validated by `validate_tap_target_config`.

    The CSV is generated on each request and returned as a string,
    it is not stored in the cache directory.
    """
    tc = validate_tap_target_config(target)
    log.debug("Requesting auroral emissions CSV for %s..." % tc['name'])

    target_name = tc['tap']['target_name']
    emissions = retrieve_auroral_emissions(target_name)

    # Be careful with regexes in python 2 ; best always use the ^$
    thumbnail_url_filter = re.compile("^.*proc(?:_small)?\\.(?:jpe?g|png|webp|gif|bmp|tiff)$")

    # Filter the emissions
    def _keep_emission(emission):
        # A missing or empty thumbnail URL can never match, and feeding None
        # to the regex would raise a TypeError and fail the whole request.
        thumbnail_url = emission.get('thumbnail_url') or ''
        return bool(thumbnail_url_filter.match(thumbnail_url))

    emissions = [e for e in emissions if _keep_emission(e)]

    # Fallback header, for when there are no emissions to take the keys from.
    header = ('time_min', 'time_max', 'thumbnail_url', 'external_link')
    if emissions:
        header = emissions[0].keys()
    si = StringIO.StringIO()
    cw = csv_dict_writer(si, fieldnames=header)
    cw.writeheader()

    log.debug("Writing auroral emissions CSV for %s..." % tc['name'])
    cw.writerows(emissions)

    log.info("Generated auroral emissions CSV contents for %s." % tc['name'])
    return si.getvalue()

    # if not isfile(local_csv_file):
    #     abort(500, "Could not cache CSV file at '%s'." % local_csv_file)
    #
    # return send_from_directory(CACHE_DIR, filename)




@app.route("/test/auroral/<target>")
def test_auroral_emissions(target):
    """
    Debug route: dump the auroral emissions retrieved for `target`,
    preceded by how many there are.
    """
    target_config = validate_tap_target_config(target)
    emissions = retrieve_auroral_emissions(
        target_config['tap']['target_name']
    )
    amount = len(emissions)
    dump = str(emissions)

    return "%d results:\n%s" % (amount, dump)


28bb4b28   Goutte   API for the cache...
1594
1595
# API #########################################################################

e18701b6   Goutte   Cache clear (remo...
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
@app.route("/cache/clear")
def cache_clear():
    """
    Empty the cache directory, and report how many files were removed.
    Note: The .gitkeep file is removed as well. Not a problem for prod.
    """
    amount = len(remove_all_files(CACHE_DIR))
    plural = '' if amount == 1 else 's'
    return "Cache cleared! Removed %d file%s." % (amount, plural)


d9710a98   Goutte   Rename the cleanu...
1608
1609
@app.route("/cache/cleanup")
def cache_cleanup():
    """
    Remove from the cache directory the files older than 32 days,
    and report how many files were removed.
    Note: The .gitkeep file is removed as well. Maybe it should not, but hey.
    """
    max_age = datetime.timedelta(days=32)
    threshold = datetime.datetime.now() - max_age
    amount = len(remove_files_created_before(threshold, CACHE_DIR))
    plural = '' if amount == 1 else 's'
    return "Cache cleaned! Removed %d old file%s." % (amount, plural)
28bb4b28   Goutte   API for the cache...
1619
1620


b500e561   Goutte   Invert the orbits...
1621
1622
1623
1624
@app.route("/cache/warmup")
def cache_warmup():
    """
    Warm up the cache: request the CSV of each active target, then the CDF
    of all of them, over the interval given by `get_interval_from_query`.
    Returns a message stating how long it took.
    """
    clock_start = datetime.datetime.now()
    sta, sto = get_interval_from_query()
    inp = 'l1'  # default input, maybe warm them all up ?

    active_targets = get_active_targets()
    joined_slugs = '-'.join(sorted([t['slug'] for t in active_targets]))

    update_spacepy()
    for active_target in active_targets:
        download_target_csv(active_target['slug'], inp, sta, sto)
    download_targets_cdf(joined_slugs, inp, sta, sto)

    elapsed = datetime.datetime.now() - clock_start

    return "Done in %s." % str(elapsed)
b500e561   Goutte   Invert the orbits...
1643
1644


1324cc91   Goutte   Make the footer i...
1645
@app.route("/log")
@app.route("/log.html")
def log_show():
    """
    Show the contents of the log file, in a preformatted HTML block.

    The contents are HTML-escaped first: log messages may embed strings
    coming from requests, and these must not be interpreted as markup
    by the browser.
    """
    with open(LOG_FILE, 'r') as f:
        contents = f.read()
    # The ampersand goes first, or we would escape our own escapes.
    escaped = contents.replace('&', '&amp;') \
                      .replace('<', '&lt;') \
                      .replace('>', '&gt;')
    return "<pre>" + escaped + "</pre>"
bde97e4d   Goutte   Add more changes ...
1651
1652


1324cc91   Goutte   Make the footer i...
1653
1654
1655
1656
1657
1658
1659
@app.route("/log/clear")
def log_clear():
    """
    Empty the log file, and confirm it with a message.
    """
    confirmation = "Log cleared successfully."
    with open(LOG_FILE, 'w') as log_file:
        log_file.truncate()
    return confirmation


1754789b   Goutte   Decorate and clea...
1660
1661
1662
1663
# DEV TOOLS ###################################################################

# @app.route("/inspect")
# def analyze_cdf():
a4a9ef03   Goutte   Cache generated C...
1664
#     """
1754789b   Goutte   Decorate and clea...
1665
#     For debug purposes.
a4a9ef03   Goutte   Cache generated C...
1666
#     """
1754789b   Goutte   Decorate and clea...
1667
1668
#     cdf_to_inspect = get_path("../res/dummy.nc")
#     cdf_to_inspect = get_path("../res/dummy_jupiter_coordinates.nc")
a4a9ef03   Goutte   Cache generated C...
1669
1670
#
#     si = StringIO.StringIO()
1754789b   Goutte   Decorate and clea...
1671
1672
#     cw = csv.DictWriter(si, fieldnames=['Name', 'Shape', 'Length'])
#     cw.writeheader()
a4a9ef03   Goutte   Cache generated C...
1673
#
1754789b   Goutte   Decorate and clea...
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
#     # Time, StartTime, StopTime, V, B, N, T, Delta_angle, P_dyn, QualityFlag
#     cdf_handle = Dataset(cdf_to_inspect, "r", format="NETCDF4")
#     for variable in cdf_handle.variables:
#         v = cdf_handle.variables[variable]
#         cw.writerow({
#             'Name': variable,
#             'Shape': v.shape,
#             'Length': v.size,
#         })
#     cdf_handle.close()
a4a9ef03   Goutte   Cache generated C...
1684
1685
1686
1687
#
#     return si.getvalue()


9390ec89   Goutte   Initial experimen...
1688
1689
1690
# MAIN ########################################################################

if __name__ == "__main__":
    # The production server goes through run.wsgi and never gets here,
    # so it is fine to enable the debug mode.
    # The configuration file is watched too, to reload when it changes.
    config_file = get_path('../config.yml')
    app.run(debug=True, extra_files=[config_file])