Juni Kim
2 years ago
9 changed files with 291 additions and 5 deletions
-
1.gitignore
-
0__init__.py
-
95app.py
-
10templates/admin.html
-
0templates/batch.html
-
21templates/batchadd.html
-
47templates/batchquery.html
-
118validate.py
@ -0,0 +1,21 @@ |
|||
{% extends "base.html" %} |
|||
|
|||
{% block content %} |
|||
<h2>Batch Upload Chemicals</h2> |
|||
<a href="https://git.junickim.me/junikimm717/walker-database/raw/master/validate.py"> Source Code with required type definitions </a> |
|||
|
|||
<form method="post" enctype="multipart/form-data"> |
|||
<label for="csv">CSV: </label> |
|||
<input type="file" name="csv"> |
|||
<input type="submit" value="Submit"> |
|||
</form> |
|||
|
|||
{% if invalid %} |
|||
<p style="color: red;">Data Points are Incorrectly added: {{invalid}}</p> |
|||
{% endif %} |
|||
|
|||
{% if success %} |
|||
<p style="color: green;">Success!</p> |
|||
{% endif %} |
|||
|
|||
{% endblock %} |
@ -0,0 +1,47 @@ |
|||
{% extends "base.html" %} |
|||
|
|||
{% block content %} |
|||
<h2>Batch Query Chemicals</h2> |
|||
<a href="https://git.junickim.me/junikimm717/walker-database/raw/master/validate.py"> Source Code with required type definitions </a> |
|||
|
|||
<form method="post" enctype="multipart/form-data"> |
|||
<label for="csv">CSV: </label> |
|||
<input type="file" name="csv"> |
|||
<input type="submit" value="Submit"> |
|||
</form> |
|||
|
|||
{% if invalid %} |
|||
<p style="color: red;">Data Points are Incorrectly added: {{invalid}}</p> |
|||
{% endif %} |
|||
|
|||
{% if success %} |
|||
<p style="color: green;">Success!</p> |
|||
{% for result in data %} |
|||
<hr> |
|||
<h2>Query {{loop.index}}</h2> |
|||
<p> |
|||
{{result.query.mz_min}} < M/Z Ratio < {{result.query.mz_max}}, |
|||
{{result.query.rt_min}} < Retention Time < {{result.query.rt_max}} |
|||
</p> |
|||
{% for hit in result.hits %} |
|||
<div> |
|||
<a href="{{hit.url}}"> |
|||
<h3>{{hit.name}}</h3> |
|||
</a> |
|||
<table> |
|||
<tr> |
|||
<td>Retention Time</td> |
|||
<td>{{hit.rt}}</td> |
|||
</tr> |
|||
<tr> |
|||
<td>M/Z Ratio</td> |
|||
<td>{{hit.mz}}</td> |
|||
</tr> |
|||
</table> |
|||
</div> |
|||
{% endfor %} |
|||
{% endfor %} |
|||
|
|||
{% endif %} |
|||
|
|||
{% endblock %} |
@ -0,0 +1,118 @@ |
|||
import csv |
|||
from datetime import date |
|||
|
|||
_required_fields = [ |
|||
("name", "str"), |
|||
("formula", "str"), |
|||
("mass", "float"), |
|||
|
|||
("final_mz", "float"), |
|||
("final_rt", "float"), |
|||
] |
|||
|
|||
_optional_fields = [ |
|||
("chemical_db_id", "str"), |
|||
("library", "str"), |
|||
|
|||
("pubchem_cid", "int"), |
|||
("pubmed_refcount", "int"), |
|||
("standard_class", "str"), |
|||
("inchikey", "str"), |
|||
("inchikey14", "str"), |
|||
|
|||
("final_adduct", "str"), |
|||
("adduct", "str"), |
|||
("detected_adducts", "str"), |
|||
("adduct_calc_mz", "str"), |
|||
("msms_detected", "yesno"), |
|||
("msms_purity", "float"), |
|||
] |
|||
|
|||
_query_fields = [ |
|||
("rt_min", "float"), |
|||
("rt_max", "float"), |
|||
|
|||
("mz_min", "float"), |
|||
("mz_max", "float"), |
|||
|
|||
# ("year_max", "int"), |
|||
# ("day_max", "int"), |
|||
# ("month_max", "int"), |
|||
] |
|||
|
|||
|
|||
def _validate_type(field: str, value: str, t): |
|||
if t == "yesno": |
|||
l = value.strip().lower() |
|||
if l == "yes": |
|||
return True |
|||
elif l == "no": |
|||
return False |
|||
else: |
|||
raise ValueError( |
|||
f"Yes/No field {field} does not have a valid value {value}") |
|||
elif t == "int": |
|||
try: |
|||
return int(value) |
|||
except ValueError: |
|||
raise ValueError( |
|||
f"Integer field {field} does not have a valid value {value}") |
|||
elif t == "float": |
|||
try: |
|||
return float(value) |
|||
except ValueError: |
|||
raise ValueError( |
|||
f"Float field {field} does not have a valid value {value}") |
|||
elif t == "str": |
|||
return value |
|||
else: |
|||
raise ValueError("Impossible") |
|||
|
|||
|
|||
def validate_insertion_csv_fields(reader: csv.DictReader) -> tuple[list[dict], str]: |
|||
chemicals: list[dict] = [] |
|||
for row in reader: |
|||
chemical = {} |
|||
for field, t in _required_fields: |
|||
if field not in row: |
|||
return [], f"Required field \"{field}\" not present in csv" |
|||
try: |
|||
value = _validate_type(field, row[field], t) |
|||
chemical[field] = value |
|||
except ValueError as e: |
|||
return [], str(e) |
|||
|
|||
for field, t in _optional_fields: |
|||
if field not in row: |
|||
continue |
|||
try: |
|||
value = _validate_type(field, row[field], t) |
|||
chemical[field] = value |
|||
except ValueError as e: |
|||
return [], str(e) |
|||
chemicals.append(chemical) |
|||
return chemicals, "" |
|||
|
|||
|
|||
def validate_query_csv_fields(reader: csv.DictReader) -> tuple[list[dict], str]: |
|||
queries: list[dict] = [] |
|||
for row in reader: |
|||
query = {} |
|||
for field, t in _query_fields: |
|||
if field not in row: |
|||
return [], f"Required field \"{field}\" not present in csv" |
|||
try: |
|||
value = _validate_type(field, row[field], t) |
|||
query[field] = value |
|||
except ValueError as e: |
|||
return [], str(e) |
|||
|
|||
# year_max, month_max, day_max = query.get( |
|||
# 'year_max'), query.get('month_max'), query.get('day_max') |
|||
# try: |
|||
# d = date(year_max, month_max, day_max) |
|||
# query["date"] = d |
|||
# except ValueError as e: |
|||
# return [], f"Invalid Date Value Provided for {month_max}/{day_max}/{year_max}" |
|||
queries.append(query) |
|||
return queries, "" |
Write
Preview
Loading…
Cancel
Save
Reference in new issue