├── gis
    ├── biolok_stn_locs.cpg
    ├── biolok_stn_locs2.CPG
    ├── forsuringsregionene.cpg
    ├── biolok_stn_locs_update_2024-12-23.cpg
    ├── site_locs.mxd
    ├── site_locs.png
    ├── biolok_stn_locs.dbf
    ├── biolok_stn_locs.sbn
    ├── biolok_stn_locs.sbx
    ├── biolok_stn_locs.shp
    ├── biolok_stn_locs.shx
    ├── biolok_stn_locs2.dbf
    ├── biolok_stn_locs2.sbn
    ├── biolok_stn_locs2.sbx
    ├── biolok_stn_locs2.shp
    ├── biolok_stn_locs2.shx
    ├── forsuringsregionene.dbf
    ├── forsuringsregionene.sbn
    ├── forsuringsregionene.sbx
    ├── forsuringsregionene.shp
    ├── forsuringsregionene.shx
    ├── site_locs_2021-08-06.png
    ├── site_locs_2025-01-01.png
    ├── biolok_stn_locs_update_2024-12-23.dbf
    ├── biolok_stn_locs_update_2024-12-23.sbn
    ├── biolok_stn_locs_update_2024-12-23.sbx
    ├── biolok_stn_locs_update_2024-12-23.shp
    ├── biolok_stn_locs_update_2024-12-23.shx
    ├── biolok_stn_locs.prj
    ├── biolok_stn_locs2.prj
    ├── biolok_stn_locs_update_2024-12-23.prj
    └── forsuringsregionene.prj
├── README.md
├── .gitattributes
├── station_locs.xlsx
├── biolok_data_2020-08-21.xlsx
├── biolok_data_2020-09-02.xlsx
├── project_overview_from_lbs.xlsx
├── station_locs_update_2024-12-23.xlsx
├── water_samples_to_add_2020-08-21.xlsx
├── notebooks
    ├── region_plots
    │   ├── water_chem_ts_region_i.png
    │   ├── water_chem_ts_region_ii.png
    │   ├── water_chem_ts_region_iii.png
    │   ├── water_chem_ts_region_iv.png
    │   ├── water_chem_ts_region_ix.png
    │   ├── water_chem_ts_region_v.png
    │   ├── water_chem_ts_region_vi.png
    │   ├── water_chem_ts_region_vii.png
    │   ├── water_chem_ts_region_x.png
    │   └── water_chem_ts_region_viii.png
    ├── regional_mk_trends.csv
    ├── biolok_figures_2018_report.ipynb
    └── update_db_2018_report.ipynb
└── .gitignore


/gis/biolok_stn_locs.cpg:
--------------------------------------------------------------------------------
1 | UTF-8


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.CPG:
--------------------------------------------------------------------------------
1 | UTF-8


--------------------------------------------------------------------------------
/gis/forsuringsregionene.cpg:
--------------------------------------------------------------------------------
1 | ANSI 1252


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.cpg:
--------------------------------------------------------------------------------
1 | UTF-8


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # Biolok
2 | 
3 | Data management for the Biolok project.
4 | 


--------------------------------------------------------------------------------
/.gitattributes:
--------------------------------------------------------------------------------
1 | # Auto detect text files and perform LF normalization
2 | * text=auto
3 | 


--------------------------------------------------------------------------------
/gis/site_locs.mxd:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/site_locs.mxd


--------------------------------------------------------------------------------
/gis/site_locs.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/site_locs.png


--------------------------------------------------------------------------------
/station_locs.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/station_locs.xlsx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.dbf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs.dbf


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.sbn:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs.sbn


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.sbx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs.sbx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.shp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs.shp


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.shx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs.shx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.dbf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs2.dbf


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.sbn:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs2.sbn


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.sbx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs2.sbx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.shp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs2.shp


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.shx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs2.shx


--------------------------------------------------------------------------------
/biolok_data_2020-08-21.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/biolok_data_2020-08-21.xlsx


--------------------------------------------------------------------------------
/biolok_data_2020-09-02.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/biolok_data_2020-09-02.xlsx


--------------------------------------------------------------------------------
/gis/forsuringsregionene.dbf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/forsuringsregionene.dbf


--------------------------------------------------------------------------------
/gis/forsuringsregionene.sbn:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/forsuringsregionene.sbn


--------------------------------------------------------------------------------
/gis/forsuringsregionene.sbx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/forsuringsregionene.sbx


--------------------------------------------------------------------------------
/gis/forsuringsregionene.shp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/forsuringsregionene.shp


--------------------------------------------------------------------------------
/gis/forsuringsregionene.shx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/forsuringsregionene.shx


--------------------------------------------------------------------------------
/gis/site_locs_2021-08-06.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/site_locs_2021-08-06.png


--------------------------------------------------------------------------------
/gis/site_locs_2025-01-01.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/site_locs_2025-01-01.png


--------------------------------------------------------------------------------
/project_overview_from_lbs.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/project_overview_from_lbs.xlsx


--------------------------------------------------------------------------------
/station_locs_update_2024-12-23.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/station_locs_update_2024-12-23.xlsx


--------------------------------------------------------------------------------
/water_samples_to_add_2020-08-21.xlsx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/water_samples_to_add_2020-08-21.xlsx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.dbf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs_update_2024-12-23.dbf


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.sbn:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs_update_2024-12-23.sbn


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.sbx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs_update_2024-12-23.sbx


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.shp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs_update_2024-12-23.shp


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.shx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/gis/biolok_stn_locs_update_2024-12-23.shx


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_i.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_i.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_ii.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_ii.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_iii.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_iii.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_iv.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_iv.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_ix.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_ix.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_v.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_v.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_vi.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_vi.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_vii.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_vii.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_x.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_x.png


--------------------------------------------------------------------------------
/notebooks/region_plots/water_chem_ts_region_viii.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/JamesSample/biolok/master/notebooks/region_plots/water_chem_ts_region_viii.png


--------------------------------------------------------------------------------
/gis/biolok_stn_locs.prj:
--------------------------------------------------------------------------------
1 | GEOGCS["GCS_WGS_1984",DATUM["D_WGS_1984",SPHEROID["WGS_1984",6378137.0,298.257223563]],PRIMEM["Greenwich",0.0],UNIT["Degree",0.0174532925199433]]


--------------------------------------------------------------------------------
/gis/biolok_stn_locs2.prj:
--------------------------------------------------------------------------------
1 | GEOGCS["GCS_WGS_1984",DATUM["D_WGS_1984",SPHEROID["WGS_1984",6378137.0,298.257223563]],PRIMEM["Greenwich",0.0],UNIT["Degree",0.0174532925199433]]


--------------------------------------------------------------------------------
/gis/biolok_stn_locs_update_2024-12-23.prj:
--------------------------------------------------------------------------------
1 | GEOGCS["GCS_WGS_1984",DATUM["D_WGS_1984",SPHEROID["WGS_1984",6378137.0,298.257223563]],PRIMEM["Greenwich",0.0],UNIT["Degree",0.0174532925199433]]


--------------------------------------------------------------------------------
/gis/forsuringsregionene.prj:
--------------------------------------------------------------------------------
1 | PROJCS["WGS_1984_UTM_Zone_33N",GEOGCS["GCS_WGS_1984",DATUM["D_WGS_1984",SPHEROID["WGS_1984",6378137.0,298.257223563]],PRIMEM["Greenwich",0.0],UNIT["Degree",0.0174532925199433]],PROJECTION["Transverse_Mercator"],PARAMETER["False_Easting",500000.0],PARAMETER["False_Northing",0.0],PARAMETER["Central_Meridian",15.0],PARAMETER["Scale_Factor",0.9996],PARAMETER["Latitude_Of_Origin",0.0],UNIT["Meter",1.0]]


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | build/
 12 | develop-eggs/
 13 | dist/
 14 | downloads/
 15 | eggs/
 16 | .eggs/
 17 | lib/
 18 | lib64/
 19 | parts/
 20 | sdist/
 21 | var/
 22 | wheels/
 23 | pip-wheel-metadata/
 24 | share/python-wheels/
 25 | *.egg-info/
 26 | .installed.cfg
 27 | *.egg
 28 | MANIFEST
 29 | 
 30 | # PyInstaller
 31 | #  Usually these files are written by a python script from a template
 32 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 33 | *.manifest
 34 | *.spec
 35 | 
 36 | # Installer logs
 37 | pip-log.txt
 38 | pip-delete-this-directory.txt
 39 | 
 40 | # Unit test / coverage reports
 41 | htmlcov/
 42 | .tox/
 43 | .nox/
 44 | .coverage
 45 | .coverage.*
 46 | .cache
 47 | nosetests.xml
 48 | coverage.xml
 49 | *.cover
 50 | *.py,cover
 51 | .hypothesis/
 52 | .pytest_cache/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | db.sqlite3-journal
 63 | 
 64 | # Flask stuff:
 65 | instance/
 66 | .webassets-cache
 67 | 
 68 | # Scrapy stuff:
 69 | .scrapy
 70 | 
 71 | # Sphinx documentation
 72 | docs/_build/
 73 | 
 74 | # PyBuilder
 75 | target/
 76 | 
 77 | # Jupyter Notebook
 78 | .ipynb_checkpoints
 79 | 
 80 | # IPython
 81 | profile_default/
 82 | ipython_config.py
 83 | 
 84 | # pyenv
 85 | .python-version
 86 | 
 87 | # pipenv
 88 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 89 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 90 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 91 | #   install all needed dependencies.
 92 | #Pipfile.lock
 93 | 
 94 | # celery beat schedule file
 95 | celerybeat-schedule
 96 | 
 97 | # SageMath parsed files
 98 | *.sage.py
 99 | 
100 | # Environments
101 | .env
102 | .venv
103 | env/
104 | venv/
105 | ENV/
106 | env.bak/
107 | venv.bak/
108 | 
109 | # Spyder project settings
110 | .spyderproject
111 | .spyproject
112 | 
113 | # Rope project settings
114 | .ropeproject
115 | 
116 | # mkdocs documentation
117 | /site
118 | 
119 | # mypy
120 | .mypy_cache/
121 | .dmypy.json
122 | dmypy.json
123 | 
124 | # Pyre type checker
125 | .pyre/
126 | 


--------------------------------------------------------------------------------
/notebooks/regional_mk_trends.csv:
--------------------------------------------------------------------------------
 1 | region,parameter,s,z,var_s,p,sslp,trend
 2 | I,ESO4_uekv/l,-991.0,-11.63525509403131,7239.666666666666,0.0,-0.8412699999999997,decreasing
 3 | I,ECa-Mg_uekv/l,-60.0,-0.6933663075078519,7240.666666666666,0.48807970071388085,-0.04429083333333361,no trend
 4 | I,ANC_uekv/l,705.0,8.27281655005634,7241.666666666666,2.220446049250313e-16,1.1235575000000004,increasing
 5 | I,pH,657.0,7.7133778580770835,7232.999999999999,1.2212453270876722e-14,0.015263157894736845,increasing
 6 | I,LAL_ug/l,-8.0,-0.08264130673512297,7174.666666666667,0.9341367555671447,0.0,no trend
 7 | I,TOC_mg-C/l,387.0,4.545792767979856,7210.333333333333,5.4728864435915625e-06,0.026666666666666648,increasing
 8 | IV,ESO4_uekv/l,-1679.0,-14.151564147572177,14059.666666666666,0.0,-2.06651,decreasing
 9 | IV,ECa-Mg_uekv/l,-711.0,-5.987848953978692,14059.666666666666,2.1263439897722947e-09,-0.5111227564102564,decreasing
10 | IV,ANC_uekv/l,1315.0,11.081737359898593,14059.666666666666,0.0,1.9401192857142857,increasing
11 | IV,pH,1137.0,9.586697014296265,14041.666666666666,0.0,0.021764705882353,increasing
12 | IV,LAL_ug/l,-1066.0,-8.985502275273886,14048.000000000002,0.0,-2.6666666666666665,decreasing
13 | IV,TOC_mg-C/l,981.0,8.270606652674687,14040.333333333334,2.220446049250313e-16,0.0918181818181818,increasing
14 | II,ESO4_uekv/l,-2320.0,-16.069846166706817,20824.666666666664,0.0,-2.2696648263888886,decreasing
15 | II,ECa-Mg_uekv/l,-1546.0,-10.705787053760268,20826.666666666664,0.0,-0.8966040760389037,decreasing
16 | II,ANC_uekv/l,1788.0,12.382680559915599,20826.666666666664,0.0,1.7542065614035092,increasing
17 | II,pH,1279.0,8.859702987302262,20807.666666666664,0.0,0.01428571428571431,increasing
18 | II,LAL_ug/l,-1201.0,-8.320436273483097,20800.333333333332,0.0,-2.0000000000000004,decreasing
19 | II,TOC_mg-C/l,1113.0,7.711259617325164,20795.0,1.2434497875801753e-14,0.08614814814814814,increasing
20 | X,ESO4_uekv/l,-720.0,-8.666635310745093,6882.666666666667,0.0,-1.3306742663043472,decreasing
21 | X,ECa-Mg_uekv/l,54.0,0.6388479436293324,6882.666666666667,0.522921855509767,0.0802303846153839,no trend
22 | X,ANC_uekv/l,700.0,8.425560615035911,6882.666666666667,0.0,1.9263091125541125,increasing
23 | X,pH,693.0,8.348667986226507,6870.333333333334,0.0,0.020000000000000316,increasing
24 | X,LAL_ug/l,14.0,0.16038386220948114,6569.999999999999,0.8725787011511899,0.0,no trend
25 | X,TOC_mg-C/l,321.0,3.8745917870024393,6821.0,0.00010680358242098897,0.013137254901960767,increasing
26 | V,ESO4_uekv/l,-1374.0,-12.677147142636008,11730.0,0.0,-1.6488776,decreasing
27 | V,ECa-Mg_uekv/l,-520.0,-4.792017018957092,11730.0,1.6511289293585918e-06,-0.3514439999999999,decreasing
28 | V,ANC_uekv/l,978.0,9.020810457651406,11730.0,0.0,1.8899920000000001,increasing
29 | V,pH,998.0,9.211234385281168,11715.333333333332,0.0,0.021568627450980368,increasing
30 | V,LAL_ug/l,-899.0,-8.295752124677072,11717.666666666666,0.0,-2.833333333333334,decreasing
31 | V,TOC_mg-C/l,950.0,8.77200874309453,11704.0,0.0,0.03611111111111106,increasing
32 | III,ESO4_uekv/l,-671.0,-9.23720648536655,5261.0,0.0,-0.8624024747474749,decreasing
33 | III,ECa-Mg_uekv/l,-87.0,-1.1856712802112288,5261.0,0.23575214060493388,-0.10593597222222106,no trend
34 | III,ANC_uekv/l,524.0,7.209850624536281,5262.0,5.60218538225854e-13,1.0438662037037039,increasing
35 | III,pH,490.0,6.743705065232814,5258.0,1.5439871603462052e-11,0.023333333333333428,increasing
36 | III,LAL_ug/l,-208.0,-2.866900355272018,5213.333333333333,0.004145135015002799,-0.14068825910931176,decreasing
37 | III,TOC_mg-C/l,324.0,4.454430953108791,5258.0,8.411599311086704e-06,0.010350877192982456,increasing
38 | VII,ESO4_uekv/l,-1209.0,-11.506849504471477,11021.0,0.0,-0.42436677419354835,decreasing
39 | VII,ECa-Mg_uekv/l,16.0,0.1428765831706107,11022.0,0.8863876527344121,0.002630833333333508,no trend
40 | VII,ANC_uekv/l,941.0,8.953193070217464,11023.0,0.0,0.6463140350877193,increasing
41 | VII,pH,1020.0,9.70960690839739,11014.0,0.0,0.018888888888888882,increasing
42 | VII,LAL_ug/l,-588.0,-5.6032813815041465,10974.666666666668,2.1033135677583914e-08,-0.3333333333333333,decreasing
43 | VII,TOC_mg-C/l,60.0,0.562389569590987,11006.0,0.5738506240062637,0.0010256410256410321,no trend
44 | VI,ESO4_uekv/l,-892.0,-9.708517041764388,8422.666666666666,0.0,-0.906736,decreasing
45 | VI,ECa-Mg_uekv/l,-150.0,-1.6235342752221031,8422.666666666666,0.10447524250493267,-0.10405453081232498,no trend
46 | VI,ANC_uekv/l,704.0,7.660030842155292,8422.666666666666,1.865174681370263e-14,1.116824431818182,increasing
47 | VI,pH,730.0,7.945218977030653,8418.666666666666,1.9984014443252818e-15,0.026904761904761924,increasing
48 | VI,LAL_ug/l,-651.0,-7.09391144746038,8395.666666666666,1.3038459201197838e-12,-1.5,decreasing
49 | VI,TOC_mg-C/l,565.0,6.155332394411776,8395.666666666666,7.492018117005728e-10,0.020875,increasing
50 | IX,ESO4_uekv/l,-34.0,-0.9964984287699772,1096.6666666666667,0.3190080301151297,-0.0524026362179487,no trend
51 | IX,ECa-Mg_uekv/l,90.0,2.6875260654705446,1096.6666666666667,0.007198348391553422,0.43646352083333295,increasing
52 | IX,ANC_uekv/l,90.0,2.6875260654705446,1096.6666666666667,0.007198348391553422,0.4849736499999999,increasing
53 | IX,pH,66.0,1.964592174394741,1094.6666666666667,0.049461458439756134,0.005634920634920839,increasing
54 | IX,LAL_ug/l,87.0,2.6092572470734536,1086.3333333333333,0.009073900073062857,0.18181818181818182,increasing
55 | IX,TOC_mg-C/l,41.0,1.2084279640112776,1095.6666666666667,0.22688268885268403,0.0032539682539682365,no trend
56 | VIII,ESO4_uekv/l,-469.0,-5.204392390329606,8086.333333333334,1.9463236622385693e-07,-0.20392529411764707,decreasing
57 | VIII,ECa-Mg_uekv/l,265.0,2.9346016451584553,8093.0,0.003339761465631419,0.20926399999999973,increasing
58 | VIII,ANC_uekv/l,613.0,6.802940177412783,8093.0,1.0250467141759145e-11,0.7292633333333335,increasing
59 | VIII,pH,397.0,4.403716637971206,8086.333333333333,1.0641191712457143e-05,0.009230769230769239,increasing
60 | VIII,LAL_ug/l,289.0,3.273502341364007,7740.333333333334,0.001062235106070064,0.03333333333333333,increasing
61 | VIII,TOC_mg-C/l,196.0,2.170421259572428,8072.0,0.029974947708887534,0.004700000000000002,increasing
62 | 


--------------------------------------------------------------------------------
/notebooks/biolok_figures_2018_report.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "code",
   5 |    "execution_count": 1,
   6 |    "metadata": {},
   7 |    "outputs": [],
   8 |    "source": [
   9 |     "%matplotlib inline\n",
  10 |     "\n",
  11 |     "import datetime as dt\n",
  12 |     "\n",
  13 |     "import matplotlib.pyplot as plt\n",
  14 |     "import numpy as np\n",
  15 |     "import pandas as pd\n",
  16 |     "import seaborn as sn\n",
  17 |     "\n",
  18 |     "import nivapy3 as nivapy\n",
  19 |     "\n",
  20 |     "plt.style.use(\"ggplot\")"
  21 |    ]
  22 |   },
  23 |   {
  24 |    "cell_type": "markdown",
  25 |    "metadata": {},
  26 |    "source": [
  27 |     "# Biolok data analysis"
  28 |    ]
  29 |   },
  30 |   {
  31 |    "cell_type": "markdown",
  32 |    "metadata": {},
  33 |    "source": [
  34 |     "## 1. Figures for the 2018 report\n",
  35 |     "\n",
  36 |     "With help from Liv Bente, I have created a new \"dataset\" named `BIOLOK rapp2018`, which is accessible under `Datasets` in RESA's `Projects` window. The steps to create this dataset are described in *update_db_2018_report.ipynb*.\n",
  37 |     "\n",
  38 |     "To export the relevant data from RESA2, select the dataset and remember to check `Use only water samples from selected projects` before extracting the data.\n",
  39 |     "\n",
   40 |     "Øyvind would like a set of plots similar to the ones on pages 29 - 38 [here](https://www.miljodirektoratet.no/globalassets/publikasjoner/m503/m503.pdf) (see e-mail received 17.08.2020 at 15:34).\n",
  41 |     "\n",
   42 |     "For now, I have manually extracted the relevant data from RESA and saved it to:\n",
  43 |     "\n",
  44 |     "    biolok\\biolok_data_2020-08-21.xlsx"
  45 |    ]
  46 |   },
  47 |   {
  48 |    "cell_type": "code",
  49 |    "execution_count": 2,
  50 |    "metadata": {},
  51 |    "outputs": [
  52 |     {
  53 |      "data": {
  54 |       "text/html": [
  55 |        "<div>\n",
  56 |        "<style scoped>\n",
  57 |        "    .dataframe tbody tr th:only-of-type {\n",
  58 |        "        vertical-align: middle;\n",
  59 |        "    }\n",
  60 |        "\n",
  61 |        "    .dataframe tbody tr th {\n",
  62 |        "        vertical-align: top;\n",
  63 |        "    }\n",
  64 |        "\n",
  65 |        "    .dataframe thead th {\n",
  66 |        "        text-align: right;\n",
  67 |        "    }\n",
  68 |        "</style>\n",
  69 |        "<table border=\"1\" class=\"dataframe\">\n",
  70 |        "  <thead>\n",
  71 |        "    <tr style=\"text-align: right;\">\n",
  72 |        "      <th></th>\n",
  73 |        "      <th>station_id</th>\n",
  74 |        "      <th>station_code</th>\n",
  75 |        "      <th>biolok_code</th>\n",
  76 |        "      <th>station_name</th>\n",
  77 |        "      <th>date</th>\n",
  78 |        "      <th>depth1</th>\n",
  79 |        "      <th>depth2</th>\n",
  80 |        "      <th>ESO4_uekv/l</th>\n",
  81 |        "      <th>ANC_uekv/l</th>\n",
  82 |        "      <th>pH</th>\n",
  83 |        "      <th>LAL_ug/l</th>\n",
  84 |        "      <th>TOC_mg-C/l</th>\n",
  85 |        "      <th>ECa-Mg_uekv/l</th>\n",
  86 |        "      <th>region</th>\n",
  87 |        "      <th>site_no</th>\n",
  88 |        "      <th>year</th>\n",
  89 |        "    </tr>\n",
  90 |        "  </thead>\n",
  91 |        "  <tbody>\n",
  92 |        "    <tr>\n",
  93 |        "      <th>0</th>\n",
  94 |        "      <td>14</td>\n",
  95 |        "      <td>432-1-26</td>\n",
  96 |        "      <td>I-3</td>\n",
  97 |        "      <td>Måsabutjørna</td>\n",
  98 |        "      <td>1995-09-20</td>\n",
  99 |        "      <td>0.0</td>\n",
 100 |        "      <td>0.0</td>\n",
 101 |        "      <td>38.68637</td>\n",
 102 |        "      <td>6.63334</td>\n",
 103 |        "      <td>5.68</td>\n",
 104 |        "      <td>0.0</td>\n",
 105 |        "      <td>1.6</td>\n",
 106 |        "      <td>26.03949</td>\n",
 107 |        "      <td>I</td>\n",
 108 |        "      <td>3</td>\n",
 109 |        "      <td>1995</td>\n",
 110 |        "    </tr>\n",
 111 |        "    <tr>\n",
 112 |        "      <th>1</th>\n",
 113 |        "      <td>14</td>\n",
 114 |        "      <td>432-1-26</td>\n",
 115 |        "      <td>I-3</td>\n",
 116 |        "      <td>Måsabutjørna</td>\n",
 117 |        "      <td>1996-10-10</td>\n",
 118 |        "      <td>0.0</td>\n",
 119 |        "      <td>0.0</td>\n",
 120 |        "      <td>36.31385</td>\n",
 121 |        "      <td>3.69217</td>\n",
 122 |        "      <td>5.73</td>\n",
 123 |        "      <td>0.0</td>\n",
 124 |        "      <td>1.9</td>\n",
 125 |        "      <td>24.88327</td>\n",
 126 |        "      <td>I</td>\n",
 127 |        "      <td>3</td>\n",
 128 |        "      <td>1996</td>\n",
 129 |        "    </tr>\n",
 130 |        "    <tr>\n",
 131 |        "      <th>2</th>\n",
 132 |        "      <td>14</td>\n",
 133 |        "      <td>432-1-26</td>\n",
 134 |        "      <td>I-3</td>\n",
 135 |        "      <td>Måsabutjørna</td>\n",
 136 |        "      <td>1997-10-26</td>\n",
 137 |        "      <td>0.0</td>\n",
 138 |        "      <td>0.0</td>\n",
 139 |        "      <td>36.02333</td>\n",
 140 |        "      <td>6.46292</td>\n",
 141 |        "      <td>5.70</td>\n",
 142 |        "      <td>9.0</td>\n",
 143 |        "      <td>1.5</td>\n",
 144 |        "      <td>27.71908</td>\n",
 145 |        "      <td>I</td>\n",
 146 |        "      <td>3</td>\n",
 147 |        "      <td>1997</td>\n",
 148 |        "    </tr>\n",
 149 |        "    <tr>\n",
 150 |        "      <th>3</th>\n",
 151 |        "      <td>14</td>\n",
 152 |        "      <td>432-1-26</td>\n",
 153 |        "      <td>I-3</td>\n",
 154 |        "      <td>Måsabutjørna</td>\n",
 155 |        "      <td>1998-07-06</td>\n",
 156 |        "      <td>0.0</td>\n",
 157 |        "      <td>0.0</td>\n",
 158 |        "      <td>30.06786</td>\n",
 159 |        "      <td>5.48708</td>\n",
 160 |        "      <td>5.78</td>\n",
 161 |        "      <td>2.0</td>\n",
 162 |        "      <td>1.7</td>\n",
 163 |        "      <td>21.91635</td>\n",
 164 |        "      <td>I</td>\n",
 165 |        "      <td>3</td>\n",
 166 |        "      <td>1998</td>\n",
 167 |        "    </tr>\n",
 168 |        "    <tr>\n",
 169 |        "      <th>4</th>\n",
 170 |        "      <td>14</td>\n",
 171 |        "      <td>432-1-26</td>\n",
 172 |        "      <td>I-3</td>\n",
 173 |        "      <td>Måsabutjørna</td>\n",
 174 |        "      <td>1998-09-15</td>\n",
 175 |        "      <td>0.0</td>\n",
 176 |        "      <td>0.0</td>\n",
 177 |        "      <td>32.14986</td>\n",
 178 |        "      <td>4.58344</td>\n",
 179 |        "      <td>5.93</td>\n",
 180 |        "      <td>2.0</td>\n",
 181 |        "      <td>1.7</td>\n",
 182 |        "      <td>22.23999</td>\n",
 183 |        "      <td>I</td>\n",
 184 |        "      <td>3</td>\n",
 185 |        "      <td>1998</td>\n",
 186 |        "    </tr>\n",
 187 |        "  </tbody>\n",
 188 |        "</table>\n",
 189 |        "</div>"
 190 |       ],
 191 |       "text/plain": [
 192 |        "   station_id station_code biolok_code  station_name       date  depth1  \\\n",
 193 |        "0          14     432-1-26         I-3  Måsabutjørna 1995-09-20     0.0   \n",
 194 |        "1          14     432-1-26         I-3  Måsabutjørna 1996-10-10     0.0   \n",
 195 |        "2          14     432-1-26         I-3  Måsabutjørna 1997-10-26     0.0   \n",
 196 |        "3          14     432-1-26         I-3  Måsabutjørna 1998-07-06     0.0   \n",
 197 |        "4          14     432-1-26         I-3  Måsabutjørna 1998-09-15     0.0   \n",
 198 |        "\n",
 199 |        "   depth2  ESO4_uekv/l  ANC_uekv/l    pH  LAL_ug/l  TOC_mg-C/l  ECa-Mg_uekv/l  \\\n",
 200 |        "0     0.0     38.68637     6.63334  5.68       0.0         1.6       26.03949   \n",
 201 |        "1     0.0     36.31385     3.69217  5.73       0.0         1.9       24.88327   \n",
 202 |        "2     0.0     36.02333     6.46292  5.70       9.0         1.5       27.71908   \n",
 203 |        "3     0.0     30.06786     5.48708  5.78       2.0         1.7       21.91635   \n",
 204 |        "4     0.0     32.14986     4.58344  5.93       2.0         1.7       22.23999   \n",
 205 |        "\n",
 206 |        "  region site_no  year  \n",
 207 |        "0      I       3  1995  \n",
 208 |        "1      I       3  1996  \n",
 209 |        "2      I       3  1997  \n",
 210 |        "3      I       3  1998  \n",
 211 |        "4      I       3  1998  "
 212 |       ]
 213 |      },
 214 |      "execution_count": 2,
 215 |      "metadata": {},
 216 |      "output_type": "execute_result"
 217 |     }
 218 |    ],
 219 |    "source": [
 220 |     "# Read data\n",
 221 |     "df = pd.read_excel(\"../biolok_data_2020-08-21.xlsx\", sheet_name=\"data\")\n",
 222 |     "\n",
 223 |     "# Replace negative LAL with 0\n",
 224 |     "df[\"LAL_ug/l\"] = df[\"LAL_ug/l\"].clip(lower=0)\n",
 225 |     "\n",
 226 |     "# Add Ca and Mg\n",
 227 |     "df[\"ECa-Mg_uekv/l\"] = df[\"EMg_uekv/l\"] + df[\"ECa_uekv/l\"]\n",
 228 |     "del df[\"EMg_uekv/l\"], df[\"ECa_uekv/l\"]\n",
 229 |     "\n",
 230 |     "# Get region and site number\n",
 231 |     "df[[\"region\", \"site_no\"]] = df[\"biolok_code\"].str.split(\"-\", expand=True)\n",
 232 |     "\n",
 233 |     "df[\"year\"] = df[\"date\"].dt.year\n",
 234 |     "\n",
 235 |     "df.head()"
 236 |    ]
 237 |   },
 238 |   {
 239 |    "cell_type": "code",
 240 |    "execution_count": 3,
 241 |    "metadata": {},
 242 |    "outputs": [],
 243 |    "source": [
 244 |     "# Annual means by station\n",
 245 |     "agg = df.groupby([\"station_name\", \"year\", \"region\"]).mean().reset_index()\n",
 246 |     "del agg[\"station_id\"], agg[\"depth1\"], agg[\"depth2\"]"
 247 |    ]
 248 |   },
 249 |   {
 250 |    "cell_type": "code",
 251 |    "execution_count": 4,
 252 |    "metadata": {},
 253 |    "outputs": [],
 254 |    "source": [
 255 |     "label_dict = {\n",
 256 |     "    \"ESO4_uekv/l\": \"Ikke-marin $SO_4$ (µekv/l)\",\n",
 257 |     "    \"ECa-Mg_uekv/l\": \"Ikke-marin Ca+Mg (µekv/l)\",\n",
 258 |     "    \"ANC_uekv/l\": \"ANC (µekv/l)\",\n",
 259 |     "    \"pH\": \"pH\",\n",
 260 |     "    \"LAL_ug/l\": \"Labilt Al (µg/l)\",\n",
 261 |     "    \"TOC_mg-C/l\": \"TOC (mg C/l)\",\n",
 262 |     "}\n",
 263 |     "\n",
 264 |     "# Pars to plot\n",
 265 |     "pars = [\"ESO4_uekv/l\", \"ECa-Mg_uekv/l\", \"ANC_uekv/l\", \"pH\", \"LAL_ug/l\", \"TOC_mg-C/l\"]\n",
 266 |     "\n",
 267 |     "# Loop over regions\n",
 268 |     "for reg in agg[\"region\"].unique():\n",
 269 |     "    reg_df = agg.query(\"region == @reg\")\n",
 270 |     "    del reg_df[\"region\"]\n",
 271 |     "\n",
 272 |     "    # Setup plot\n",
 273 |     "    fig, axes = plt.subplots(nrows=2, ncols=3, figsize=(16, 9))\n",
 274 |     "    axes = axes.flatten()\n",
 275 |     "\n",
 276 |     "    # Loop over pars\n",
 277 |     "    #    max_list = []\n",
 278 |     "    for idx, par in enumerate(pars):\n",
 279 |     "        par_df = reg_df[[\"station_name\", \"year\", par]].copy()\n",
 280 |     "        par_df.set_index([\"station_name\", \"year\"], inplace=True)\n",
 281 |     "        par_df = par_df.unstack(\"station_name\")\n",
 282 |     "        par_df.columns = par_df.columns.get_level_values(1)\n",
 283 |     "\n",
 284 |     "        if len(par_df.columns) > 1:\n",
 285 |     "            par_df[\"Snitt\"] = par_df.mean(axis=1, skipna=False)\n",
 286 |     "\n",
 287 |     "        #        if par in [\"ESO4_uekv/l\", \"ECa-Mg_uekv/l\", \"ANC_uekv/l\"]:\n",
 288 |     "        #            max_list.append(np.nanmax(par_df.values))\n",
 289 |     "\n",
 290 |     "        # Plot each station\n",
 291 |     "        for stn in par_df.columns:\n",
 292 |     "            if stn == \"Snitt\":\n",
 293 |     "                par_df[stn].dropna().plot(ax=axes[idx], style=\"-\", lw=3, c=\"k\")\n",
 294 |     "            else:\n",
 295 |     "                par_df[stn].dropna().plot(ax=axes[idx], style=\"--\", lw=2)\n",
 296 |     "\n",
 297 |     "        #        if par == 'pH':\n",
 298 |     "        #            axes[idx].set_ylim((4, 7))\n",
 299 |     "        axes[idx].set_xlim((1985, 2020))\n",
 300 |     "        axes[idx].set_xlabel(\"\")\n",
 301 |     "        axes[idx].set_ylabel(label_dict[par])\n",
 302 |     "\n",
 303 |     "    #    for ax in [0, 1]:\n",
 304 |     "    #        axes[ax].set_ylim((0, max(max_list)))\n",
 305 |     "    #    axes[2].set_ylim(ymax=max(max_list))\n",
 306 |     "\n",
 307 |     "    axes[-1].legend(loc=\"upper center\", bbox_to_anchor=(0.5, -0.1), ncol=3)\n",
 308 |     "    plt.tight_layout()\n",
 309 |     "\n",
 310 |     "    out_png = f\"./region_plots/water_chem_ts_region_{reg.lower()}.png\"\n",
 311 |     "    plt.savefig(out_png, dpi=300)\n",
 312 |     "    plt.close()"
 313 |    ]
 314 |   },
 315 |   {
 316 |    "cell_type": "markdown",
 317 |    "metadata": {},
 318 |    "source": [
 319 |     "## 2. Regional Mann-Kendall"
 320 |    ]
 321 |   },
 322 |   {
 323 |    "cell_type": "code",
 324 |    "execution_count": 5,
 325 |    "metadata": {},
 326 |    "outputs": [
 327 |     {
 328 |      "name": "stdout",
 329 |      "output_type": "stream",
 330 |      "text": [
 331 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 332 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 333 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 334 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 335 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 336 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 337 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 338 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 339 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 340 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 341 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 342 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 343 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 344 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 345 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 346 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 347 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 348 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 349 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 350 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 351 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 352 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 353 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 354 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 355 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 356 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 357 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 358 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 359 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n",
 360 |       "WARNING: The data series has fewer than 10 non-null values. Significance estimates may be unreliable.\n"
 361 |      ]
 362 |     },
 363 |     {
 364 |      "data": {
 365 |       "text/html": [
 366 |        "<div>\n",
 367 |        "<style scoped>\n",
 368 |        "    .dataframe tbody tr th:only-of-type {\n",
 369 |        "        vertical-align: middle;\n",
 370 |        "    }\n",
 371 |        "\n",
 372 |        "    .dataframe tbody tr th {\n",
 373 |        "        vertical-align: top;\n",
 374 |        "    }\n",
 375 |        "\n",
 376 |        "    .dataframe thead th {\n",
 377 |        "        text-align: right;\n",
 378 |        "    }\n",
 379 |        "</style>\n",
 380 |        "<table border=\"1\" class=\"dataframe\">\n",
 381 |        "  <thead>\n",
 382 |        "    <tr style=\"text-align: right;\">\n",
 383 |        "      <th></th>\n",
 384 |        "      <th>region</th>\n",
 385 |        "      <th>parameter</th>\n",
 386 |        "      <th>s</th>\n",
 387 |        "      <th>z</th>\n",
 388 |        "      <th>var_s</th>\n",
 389 |        "      <th>p</th>\n",
 390 |        "      <th>sslp</th>\n",
 391 |        "      <th>trend</th>\n",
 392 |        "    </tr>\n",
 393 |        "  </thead>\n",
 394 |        "  <tbody>\n",
 395 |        "    <tr>\n",
 396 |        "      <th>0</th>\n",
 397 |        "      <td>I</td>\n",
 398 |        "      <td>ESO4_uekv/l</td>\n",
 399 |        "      <td>-991</td>\n",
 400 |        "      <td>-11.6353</td>\n",
 401 |        "      <td>7239.67</td>\n",
 402 |        "      <td>0</td>\n",
 403 |        "      <td>-0.84127</td>\n",
 404 |        "      <td>decreasing</td>\n",
 405 |        "    </tr>\n",
 406 |        "    <tr>\n",
 407 |        "      <th>1</th>\n",
 408 |        "      <td>I</td>\n",
 409 |        "      <td>ECa-Mg_uekv/l</td>\n",
 410 |        "      <td>-60</td>\n",
 411 |        "      <td>-0.693366</td>\n",
 412 |        "      <td>7240.67</td>\n",
 413 |        "      <td>0.48808</td>\n",
 414 |        "      <td>-0.0442908</td>\n",
 415 |        "      <td>no trend</td>\n",
 416 |        "    </tr>\n",
 417 |        "    <tr>\n",
 418 |        "      <th>2</th>\n",
 419 |        "      <td>I</td>\n",
 420 |        "      <td>ANC_uekv/l</td>\n",
 421 |        "      <td>705</td>\n",
 422 |        "      <td>8.27282</td>\n",
 423 |        "      <td>7241.67</td>\n",
 424 |        "      <td>2.22045e-16</td>\n",
 425 |        "      <td>1.12356</td>\n",
 426 |        "      <td>increasing</td>\n",
 427 |        "    </tr>\n",
 428 |        "    <tr>\n",
 429 |        "      <th>3</th>\n",
 430 |        "      <td>I</td>\n",
 431 |        "      <td>pH</td>\n",
 432 |        "      <td>657</td>\n",
 433 |        "      <td>7.71338</td>\n",
 434 |        "      <td>7233</td>\n",
 435 |        "      <td>1.22125e-14</td>\n",
 436 |        "      <td>0.0152632</td>\n",
 437 |        "      <td>increasing</td>\n",
 438 |        "    </tr>\n",
 439 |        "    <tr>\n",
 440 |        "      <th>4</th>\n",
 441 |        "      <td>I</td>\n",
 442 |        "      <td>LAL_ug/l</td>\n",
 443 |        "      <td>-8</td>\n",
 444 |        "      <td>-0.0826413</td>\n",
 445 |        "      <td>7174.67</td>\n",
 446 |        "      <td>0.934137</td>\n",
 447 |        "      <td>0</td>\n",
 448 |        "      <td>no trend</td>\n",
 449 |        "    </tr>\n",
 450 |        "    <tr>\n",
 451 |        "      <th>5</th>\n",
 452 |        "      <td>I</td>\n",
 453 |        "      <td>TOC_mg-C/l</td>\n",
 454 |        "      <td>387</td>\n",
 455 |        "      <td>4.54579</td>\n",
 456 |        "      <td>7210.33</td>\n",
 457 |        "      <td>5.47289e-06</td>\n",
 458 |        "      <td>0.0266667</td>\n",
 459 |        "      <td>increasing</td>\n",
 460 |        "    </tr>\n",
 461 |        "    <tr>\n",
 462 |        "      <th>6</th>\n",
 463 |        "      <td>IV</td>\n",
 464 |        "      <td>ESO4_uekv/l</td>\n",
 465 |        "      <td>-1679</td>\n",
 466 |        "      <td>-14.1516</td>\n",
 467 |        "      <td>14059.7</td>\n",
 468 |        "      <td>0</td>\n",
 469 |        "      <td>-2.06651</td>\n",
 470 |        "      <td>decreasing</td>\n",
 471 |        "    </tr>\n",
 472 |        "    <tr>\n",
 473 |        "      <th>7</th>\n",
 474 |        "      <td>IV</td>\n",
 475 |        "      <td>ECa-Mg_uekv/l</td>\n",
 476 |        "      <td>-711</td>\n",
 477 |        "      <td>-5.98785</td>\n",
 478 |        "      <td>14059.7</td>\n",
 479 |        "      <td>2.12634e-09</td>\n",
 480 |        "      <td>-0.511123</td>\n",
 481 |        "      <td>decreasing</td>\n",
 482 |        "    </tr>\n",
 483 |        "    <tr>\n",
 484 |        "      <th>8</th>\n",
 485 |        "      <td>IV</td>\n",
 486 |        "      <td>ANC_uekv/l</td>\n",
 487 |        "      <td>1315</td>\n",
 488 |        "      <td>11.0817</td>\n",
 489 |        "      <td>14059.7</td>\n",
 490 |        "      <td>0</td>\n",
 491 |        "      <td>1.94012</td>\n",
 492 |        "      <td>increasing</td>\n",
 493 |        "    </tr>\n",
 494 |        "    <tr>\n",
 495 |        "      <th>9</th>\n",
 496 |        "      <td>IV</td>\n",
 497 |        "      <td>pH</td>\n",
 498 |        "      <td>1137</td>\n",
 499 |        "      <td>9.5867</td>\n",
 500 |        "      <td>14041.7</td>\n",
 501 |        "      <td>0</td>\n",
 502 |        "      <td>0.0217647</td>\n",
 503 |        "      <td>increasing</td>\n",
 504 |        "    </tr>\n",
 505 |        "    <tr>\n",
 506 |        "      <th>10</th>\n",
 507 |        "      <td>IV</td>\n",
 508 |        "      <td>LAL_ug/l</td>\n",
 509 |        "      <td>-1066</td>\n",
 510 |        "      <td>-8.9855</td>\n",
 511 |        "      <td>14048</td>\n",
 512 |        "      <td>0</td>\n",
 513 |        "      <td>-2.66667</td>\n",
 514 |        "      <td>decreasing</td>\n",
 515 |        "    </tr>\n",
 516 |        "    <tr>\n",
 517 |        "      <th>11</th>\n",
 518 |        "      <td>IV</td>\n",
 519 |        "      <td>TOC_mg-C/l</td>\n",
 520 |        "      <td>981</td>\n",
 521 |        "      <td>8.27061</td>\n",
 522 |        "      <td>14040.3</td>\n",
 523 |        "      <td>2.22045e-16</td>\n",
 524 |        "      <td>0.0918182</td>\n",
 525 |        "      <td>increasing</td>\n",
 526 |        "    </tr>\n",
 527 |        "    <tr>\n",
 528 |        "      <th>12</th>\n",
 529 |        "      <td>II</td>\n",
 530 |        "      <td>ESO4_uekv/l</td>\n",
 531 |        "      <td>-2320</td>\n",
 532 |        "      <td>-16.0698</td>\n",
 533 |        "      <td>20824.7</td>\n",
 534 |        "      <td>0</td>\n",
 535 |        "      <td>-2.26966</td>\n",
 536 |        "      <td>decreasing</td>\n",
 537 |        "    </tr>\n",
 538 |        "    <tr>\n",
 539 |        "      <th>13</th>\n",
 540 |        "      <td>II</td>\n",
 541 |        "      <td>ECa-Mg_uekv/l</td>\n",
 542 |        "      <td>-1546</td>\n",
 543 |        "      <td>-10.7058</td>\n",
 544 |        "      <td>20826.7</td>\n",
 545 |        "      <td>0</td>\n",
 546 |        "      <td>-0.896604</td>\n",
 547 |        "      <td>decreasing</td>\n",
 548 |        "    </tr>\n",
 549 |        "    <tr>\n",
 550 |        "      <th>14</th>\n",
 551 |        "      <td>II</td>\n",
 552 |        "      <td>ANC_uekv/l</td>\n",
 553 |        "      <td>1788</td>\n",
 554 |        "      <td>12.3827</td>\n",
 555 |        "      <td>20826.7</td>\n",
 556 |        "      <td>0</td>\n",
 557 |        "      <td>1.75421</td>\n",
 558 |        "      <td>increasing</td>\n",
 559 |        "    </tr>\n",
 560 |        "    <tr>\n",
 561 |        "      <th>15</th>\n",
 562 |        "      <td>II</td>\n",
 563 |        "      <td>pH</td>\n",
 564 |        "      <td>1279</td>\n",
 565 |        "      <td>8.8597</td>\n",
 566 |        "      <td>20807.7</td>\n",
 567 |        "      <td>0</td>\n",
 568 |        "      <td>0.0142857</td>\n",
 569 |        "      <td>increasing</td>\n",
 570 |        "    </tr>\n",
 571 |        "    <tr>\n",
 572 |        "      <th>16</th>\n",
 573 |        "      <td>II</td>\n",
 574 |        "      <td>LAL_ug/l</td>\n",
 575 |        "      <td>-1201</td>\n",
 576 |        "      <td>-8.32044</td>\n",
 577 |        "      <td>20800.3</td>\n",
 578 |        "      <td>0</td>\n",
 579 |        "      <td>-2</td>\n",
 580 |        "      <td>decreasing</td>\n",
 581 |        "    </tr>\n",
 582 |        "    <tr>\n",
 583 |        "      <th>17</th>\n",
 584 |        "      <td>II</td>\n",
 585 |        "      <td>TOC_mg-C/l</td>\n",
 586 |        "      <td>1113</td>\n",
 587 |        "      <td>7.71126</td>\n",
 588 |        "      <td>20795</td>\n",
 589 |        "      <td>1.24345e-14</td>\n",
 590 |        "      <td>0.0861481</td>\n",
 591 |        "      <td>increasing</td>\n",
 592 |        "    </tr>\n",
 593 |        "    <tr>\n",
 594 |        "      <th>18</th>\n",
 595 |        "      <td>X</td>\n",
 596 |        "      <td>ESO4_uekv/l</td>\n",
 597 |        "      <td>-720</td>\n",
 598 |        "      <td>-8.66664</td>\n",
 599 |        "      <td>6882.67</td>\n",
 600 |        "      <td>0</td>\n",
 601 |        "      <td>-1.33067</td>\n",
 602 |        "      <td>decreasing</td>\n",
 603 |        "    </tr>\n",
 604 |        "    <tr>\n",
 605 |        "      <th>19</th>\n",
 606 |        "      <td>X</td>\n",
 607 |        "      <td>ECa-Mg_uekv/l</td>\n",
 608 |        "      <td>54</td>\n",
 609 |        "      <td>0.638848</td>\n",
 610 |        "      <td>6882.67</td>\n",
 611 |        "      <td>0.522922</td>\n",
 612 |        "      <td>0.0802304</td>\n",
 613 |        "      <td>no trend</td>\n",
 614 |        "    </tr>\n",
 615 |        "    <tr>\n",
 616 |        "      <th>20</th>\n",
 617 |        "      <td>X</td>\n",
 618 |        "      <td>ANC_uekv/l</td>\n",
 619 |        "      <td>700</td>\n",
 620 |        "      <td>8.42556</td>\n",
 621 |        "      <td>6882.67</td>\n",
 622 |        "      <td>0</td>\n",
 623 |        "      <td>1.92631</td>\n",
 624 |        "      <td>increasing</td>\n",
 625 |        "    </tr>\n",
 626 |        "    <tr>\n",
 627 |        "      <th>21</th>\n",
 628 |        "      <td>X</td>\n",
 629 |        "      <td>pH</td>\n",
 630 |        "      <td>693</td>\n",
 631 |        "      <td>8.34867</td>\n",
 632 |        "      <td>6870.33</td>\n",
 633 |        "      <td>0</td>\n",
 634 |        "      <td>0.02</td>\n",
 635 |        "      <td>increasing</td>\n",
 636 |        "    </tr>\n",
 637 |        "    <tr>\n",
 638 |        "      <th>22</th>\n",
 639 |        "      <td>X</td>\n",
 640 |        "      <td>LAL_ug/l</td>\n",
 641 |        "      <td>14</td>\n",
 642 |        "      <td>0.160384</td>\n",
 643 |        "      <td>6570</td>\n",
 644 |        "      <td>0.872579</td>\n",
 645 |        "      <td>0</td>\n",
 646 |        "      <td>no trend</td>\n",
 647 |        "    </tr>\n",
 648 |        "    <tr>\n",
 649 |        "      <th>23</th>\n",
 650 |        "      <td>X</td>\n",
 651 |        "      <td>TOC_mg-C/l</td>\n",
 652 |        "      <td>321</td>\n",
 653 |        "      <td>3.87459</td>\n",
 654 |        "      <td>6821</td>\n",
 655 |        "      <td>0.000106804</td>\n",
 656 |        "      <td>0.0131373</td>\n",
 657 |        "      <td>increasing</td>\n",
 658 |        "    </tr>\n",
 659 |        "    <tr>\n",
 660 |        "      <th>24</th>\n",
 661 |        "      <td>V</td>\n",
 662 |        "      <td>ESO4_uekv/l</td>\n",
 663 |        "      <td>-1374</td>\n",
 664 |        "      <td>-12.6771</td>\n",
 665 |        "      <td>11730</td>\n",
 666 |        "      <td>0</td>\n",
 667 |        "      <td>-1.64888</td>\n",
 668 |        "      <td>decreasing</td>\n",
 669 |        "    </tr>\n",
 670 |        "    <tr>\n",
 671 |        "      <th>25</th>\n",
 672 |        "      <td>V</td>\n",
 673 |        "      <td>ECa-Mg_uekv/l</td>\n",
 674 |        "      <td>-520</td>\n",
 675 |        "      <td>-4.79202</td>\n",
 676 |        "      <td>11730</td>\n",
 677 |        "      <td>1.65113e-06</td>\n",
 678 |        "      <td>-0.351444</td>\n",
 679 |        "      <td>decreasing</td>\n",
 680 |        "    </tr>\n",
 681 |        "    <tr>\n",
 682 |        "      <th>26</th>\n",
 683 |        "      <td>V</td>\n",
 684 |        "      <td>ANC_uekv/l</td>\n",
 685 |        "      <td>978</td>\n",
 686 |        "      <td>9.02081</td>\n",
 687 |        "      <td>11730</td>\n",
 688 |        "      <td>0</td>\n",
 689 |        "      <td>1.88999</td>\n",
 690 |        "      <td>increasing</td>\n",
 691 |        "    </tr>\n",
 692 |        "    <tr>\n",
 693 |        "      <th>27</th>\n",
 694 |        "      <td>V</td>\n",
 695 |        "      <td>pH</td>\n",
 696 |        "      <td>998</td>\n",
 697 |        "      <td>9.21123</td>\n",
 698 |        "      <td>11715.3</td>\n",
 699 |        "      <td>0</td>\n",
 700 |        "      <td>0.0215686</td>\n",
 701 |        "      <td>increasing</td>\n",
 702 |        "    </tr>\n",
 703 |        "    <tr>\n",
 704 |        "      <th>28</th>\n",
 705 |        "      <td>V</td>\n",
 706 |        "      <td>LAL_ug/l</td>\n",
 707 |        "      <td>-899</td>\n",
 708 |        "      <td>-8.29575</td>\n",
 709 |        "      <td>11717.7</td>\n",
 710 |        "      <td>0</td>\n",
 711 |        "      <td>-2.83333</td>\n",
 712 |        "      <td>decreasing</td>\n",
 713 |        "    </tr>\n",
 714 |        "    <tr>\n",
 715 |        "      <th>29</th>\n",
 716 |        "      <td>V</td>\n",
 717 |        "      <td>TOC_mg-C/l</td>\n",
 718 |        "      <td>950</td>\n",
 719 |        "      <td>8.77201</td>\n",
 720 |        "      <td>11704</td>\n",
 721 |        "      <td>0</td>\n",
 722 |        "      <td>0.0361111</td>\n",
 723 |        "      <td>increasing</td>\n",
 724 |        "    </tr>\n",
 725 |        "    <tr>\n",
 726 |        "      <th>30</th>\n",
 727 |        "      <td>III</td>\n",
 728 |        "      <td>ESO4_uekv/l</td>\n",
 729 |        "      <td>-671</td>\n",
 730 |        "      <td>-9.23721</td>\n",
 731 |        "      <td>5261</td>\n",
 732 |        "      <td>0</td>\n",
 733 |        "      <td>-0.862402</td>\n",
 734 |        "      <td>decreasing</td>\n",
 735 |        "    </tr>\n",
 736 |        "    <tr>\n",
 737 |        "      <th>31</th>\n",
 738 |        "      <td>III</td>\n",
 739 |        "      <td>ECa-Mg_uekv/l</td>\n",
 740 |        "      <td>-87</td>\n",
 741 |        "      <td>-1.18567</td>\n",
 742 |        "      <td>5261</td>\n",
 743 |        "      <td>0.235752</td>\n",
 744 |        "      <td>-0.105936</td>\n",
 745 |        "      <td>no trend</td>\n",
 746 |        "    </tr>\n",
 747 |        "    <tr>\n",
 748 |        "      <th>32</th>\n",
 749 |        "      <td>III</td>\n",
 750 |        "      <td>ANC_uekv/l</td>\n",
 751 |        "      <td>524</td>\n",
 752 |        "      <td>7.20985</td>\n",
 753 |        "      <td>5262</td>\n",
 754 |        "      <td>5.60219e-13</td>\n",
 755 |        "      <td>1.04387</td>\n",
 756 |        "      <td>increasing</td>\n",
 757 |        "    </tr>\n",
 758 |        "    <tr>\n",
 759 |        "      <th>33</th>\n",
 760 |        "      <td>III</td>\n",
 761 |        "      <td>pH</td>\n",
 762 |        "      <td>490</td>\n",
 763 |        "      <td>6.74371</td>\n",
 764 |        "      <td>5258</td>\n",
 765 |        "      <td>1.54399e-11</td>\n",
 766 |        "      <td>0.0233333</td>\n",
 767 |        "      <td>increasing</td>\n",
 768 |        "    </tr>\n",
 769 |        "    <tr>\n",
 770 |        "      <th>34</th>\n",
 771 |        "      <td>III</td>\n",
 772 |        "      <td>LAL_ug/l</td>\n",
 773 |        "      <td>-208</td>\n",
 774 |        "      <td>-2.8669</td>\n",
 775 |        "      <td>5213.33</td>\n",
 776 |        "      <td>0.00414514</td>\n",
 777 |        "      <td>-0.140688</td>\n",
 778 |        "      <td>decreasing</td>\n",
 779 |        "    </tr>\n",
 780 |        "    <tr>\n",
 781 |        "      <th>35</th>\n",
 782 |        "      <td>III</td>\n",
 783 |        "      <td>TOC_mg-C/l</td>\n",
 784 |        "      <td>324</td>\n",
 785 |        "      <td>4.45443</td>\n",
 786 |        "      <td>5258</td>\n",
 787 |        "      <td>8.4116e-06</td>\n",
 788 |        "      <td>0.0103509</td>\n",
 789 |        "      <td>increasing</td>\n",
 790 |        "    </tr>\n",
 791 |        "    <tr>\n",
 792 |        "      <th>36</th>\n",
 793 |        "      <td>VII</td>\n",
 794 |        "      <td>ESO4_uekv/l</td>\n",
 795 |        "      <td>-1209</td>\n",
 796 |        "      <td>-11.5068</td>\n",
 797 |        "      <td>11021</td>\n",
 798 |        "      <td>0</td>\n",
 799 |        "      <td>-0.424367</td>\n",
 800 |        "      <td>decreasing</td>\n",
 801 |        "    </tr>\n",
 802 |        "    <tr>\n",
 803 |        "      <th>37</th>\n",
 804 |        "      <td>VII</td>\n",
 805 |        "      <td>ECa-Mg_uekv/l</td>\n",
 806 |        "      <td>16</td>\n",
 807 |        "      <td>0.142877</td>\n",
 808 |        "      <td>11022</td>\n",
 809 |        "      <td>0.886388</td>\n",
 810 |        "      <td>0.00263083</td>\n",
 811 |        "      <td>no trend</td>\n",
 812 |        "    </tr>\n",
 813 |        "    <tr>\n",
 814 |        "      <th>38</th>\n",
 815 |        "      <td>VII</td>\n",
 816 |        "      <td>ANC_uekv/l</td>\n",
 817 |        "      <td>941</td>\n",
 818 |        "      <td>8.95319</td>\n",
 819 |        "      <td>11023</td>\n",
 820 |        "      <td>0</td>\n",
 821 |        "      <td>0.646314</td>\n",
 822 |        "      <td>increasing</td>\n",
 823 |        "    </tr>\n",
 824 |        "    <tr>\n",
 825 |        "      <th>39</th>\n",
 826 |        "      <td>VII</td>\n",
 827 |        "      <td>pH</td>\n",
 828 |        "      <td>1020</td>\n",
 829 |        "      <td>9.70961</td>\n",
 830 |        "      <td>11014</td>\n",
 831 |        "      <td>0</td>\n",
 832 |        "      <td>0.0188889</td>\n",
 833 |        "      <td>increasing</td>\n",
 834 |        "    </tr>\n",
 835 |        "    <tr>\n",
 836 |        "      <th>40</th>\n",
 837 |        "      <td>VII</td>\n",
 838 |        "      <td>LAL_ug/l</td>\n",
 839 |        "      <td>-588</td>\n",
 840 |        "      <td>-5.60328</td>\n",
 841 |        "      <td>10974.7</td>\n",
 842 |        "      <td>2.10331e-08</td>\n",
 843 |        "      <td>-0.333333</td>\n",
 844 |        "      <td>decreasing</td>\n",
 845 |        "    </tr>\n",
 846 |        "    <tr>\n",
 847 |        "      <th>41</th>\n",
 848 |        "      <td>VII</td>\n",
 849 |        "      <td>TOC_mg-C/l</td>\n",
 850 |        "      <td>60</td>\n",
 851 |        "      <td>0.56239</td>\n",
 852 |        "      <td>11006</td>\n",
 853 |        "      <td>0.573851</td>\n",
 854 |        "      <td>0.00102564</td>\n",
 855 |        "      <td>no trend</td>\n",
 856 |        "    </tr>\n",
 857 |        "    <tr>\n",
 858 |        "      <th>42</th>\n",
 859 |        "      <td>VI</td>\n",
 860 |        "      <td>ESO4_uekv/l</td>\n",
 861 |        "      <td>-892</td>\n",
 862 |        "      <td>-9.70852</td>\n",
 863 |        "      <td>8422.67</td>\n",
 864 |        "      <td>0</td>\n",
 865 |        "      <td>-0.906736</td>\n",
 866 |        "      <td>decreasing</td>\n",
 867 |        "    </tr>\n",
 868 |        "    <tr>\n",
 869 |        "      <th>43</th>\n",
 870 |        "      <td>VI</td>\n",
 871 |        "      <td>ECa-Mg_uekv/l</td>\n",
 872 |        "      <td>-150</td>\n",
 873 |        "      <td>-1.62353</td>\n",
 874 |        "      <td>8422.67</td>\n",
 875 |        "      <td>0.104475</td>\n",
 876 |        "      <td>-0.104055</td>\n",
 877 |        "      <td>no trend</td>\n",
 878 |        "    </tr>\n",
 879 |        "    <tr>\n",
 880 |        "      <th>44</th>\n",
 881 |        "      <td>VI</td>\n",
 882 |        "      <td>ANC_uekv/l</td>\n",
 883 |        "      <td>704</td>\n",
 884 |        "      <td>7.66003</td>\n",
 885 |        "      <td>8422.67</td>\n",
 886 |        "      <td>1.86517e-14</td>\n",
 887 |        "      <td>1.11682</td>\n",
 888 |        "      <td>increasing</td>\n",
 889 |        "    </tr>\n",
 890 |        "    <tr>\n",
 891 |        "      <th>45</th>\n",
 892 |        "      <td>VI</td>\n",
 893 |        "      <td>pH</td>\n",
 894 |        "      <td>730</td>\n",
 895 |        "      <td>7.94522</td>\n",
 896 |        "      <td>8418.67</td>\n",
 897 |        "      <td>1.9984e-15</td>\n",
 898 |        "      <td>0.0269048</td>\n",
 899 |        "      <td>increasing</td>\n",
 900 |        "    </tr>\n",
 901 |        "    <tr>\n",
 902 |        "      <th>46</th>\n",
 903 |        "      <td>VI</td>\n",
 904 |        "      <td>LAL_ug/l</td>\n",
 905 |        "      <td>-651</td>\n",
 906 |        "      <td>-7.09391</td>\n",
 907 |        "      <td>8395.67</td>\n",
 908 |        "      <td>1.30385e-12</td>\n",
 909 |        "      <td>-1.5</td>\n",
 910 |        "      <td>decreasing</td>\n",
 911 |        "    </tr>\n",
 912 |        "    <tr>\n",
 913 |        "      <th>47</th>\n",
 914 |        "      <td>VI</td>\n",
 915 |        "      <td>TOC_mg-C/l</td>\n",
 916 |        "      <td>565</td>\n",
 917 |        "      <td>6.15533</td>\n",
 918 |        "      <td>8395.67</td>\n",
 919 |        "      <td>7.49202e-10</td>\n",
 920 |        "      <td>0.020875</td>\n",
 921 |        "      <td>increasing</td>\n",
 922 |        "    </tr>\n",
 923 |        "    <tr>\n",
 924 |        "      <th>48</th>\n",
 925 |        "      <td>IX</td>\n",
 926 |        "      <td>ESO4_uekv/l</td>\n",
 927 |        "      <td>-34</td>\n",
 928 |        "      <td>-0.996498</td>\n",
 929 |        "      <td>1096.67</td>\n",
 930 |        "      <td>0.319008</td>\n",
 931 |        "      <td>-0.0524026</td>\n",
 932 |        "      <td>no trend</td>\n",
 933 |        "    </tr>\n",
 934 |        "    <tr>\n",
 935 |        "      <th>49</th>\n",
 936 |        "      <td>IX</td>\n",
 937 |        "      <td>ECa-Mg_uekv/l</td>\n",
 938 |        "      <td>90</td>\n",
 939 |        "      <td>2.68753</td>\n",
 940 |        "      <td>1096.67</td>\n",
 941 |        "      <td>0.00719835</td>\n",
 942 |        "      <td>0.436464</td>\n",
 943 |        "      <td>increasing</td>\n",
 944 |        "    </tr>\n",
 945 |        "    <tr>\n",
 946 |        "      <th>50</th>\n",
 947 |        "      <td>IX</td>\n",
 948 |        "      <td>ANC_uekv/l</td>\n",
 949 |        "      <td>90</td>\n",
 950 |        "      <td>2.68753</td>\n",
 951 |        "      <td>1096.67</td>\n",
 952 |        "      <td>0.00719835</td>\n",
 953 |        "      <td>0.484974</td>\n",
 954 |        "      <td>increasing</td>\n",
 955 |        "    </tr>\n",
 956 |        "    <tr>\n",
 957 |        "      <th>51</th>\n",
 958 |        "      <td>IX</td>\n",
 959 |        "      <td>pH</td>\n",
 960 |        "      <td>66</td>\n",
 961 |        "      <td>1.96459</td>\n",
 962 |        "      <td>1094.67</td>\n",
 963 |        "      <td>0.0494615</td>\n",
 964 |        "      <td>0.00563492</td>\n",
 965 |        "      <td>increasing</td>\n",
 966 |        "    </tr>\n",
 967 |        "    <tr>\n",
 968 |        "      <th>52</th>\n",
 969 |        "      <td>IX</td>\n",
 970 |        "      <td>LAL_ug/l</td>\n",
 971 |        "      <td>87</td>\n",
 972 |        "      <td>2.60926</td>\n",
 973 |        "      <td>1086.33</td>\n",
 974 |        "      <td>0.0090739</td>\n",
 975 |        "      <td>0.181818</td>\n",
 976 |        "      <td>increasing</td>\n",
 977 |        "    </tr>\n",
 978 |        "    <tr>\n",
 979 |        "      <th>53</th>\n",
 980 |        "      <td>IX</td>\n",
 981 |        "      <td>TOC_mg-C/l</td>\n",
 982 |        "      <td>41</td>\n",
 983 |        "      <td>1.20843</td>\n",
 984 |        "      <td>1095.67</td>\n",
 985 |        "      <td>0.226883</td>\n",
 986 |        "      <td>0.00325397</td>\n",
 987 |        "      <td>no trend</td>\n",
 988 |        "    </tr>\n",
 989 |        "    <tr>\n",
 990 |        "      <th>54</th>\n",
 991 |        "      <td>VIII</td>\n",
 992 |        "      <td>ESO4_uekv/l</td>\n",
 993 |        "      <td>-469</td>\n",
 994 |        "      <td>-5.20439</td>\n",
 995 |        "      <td>8086.33</td>\n",
 996 |        "      <td>1.94632e-07</td>\n",
 997 |        "      <td>-0.203925</td>\n",
 998 |        "      <td>decreasing</td>\n",
 999 |        "    </tr>\n",
1000 |        "    <tr>\n",
1001 |        "      <th>55</th>\n",
1002 |        "      <td>VIII</td>\n",
1003 |        "      <td>ECa-Mg_uekv/l</td>\n",
1004 |        "      <td>265</td>\n",
1005 |        "      <td>2.9346</td>\n",
1006 |        "      <td>8093</td>\n",
1007 |        "      <td>0.00333976</td>\n",
1008 |        "      <td>0.209264</td>\n",
1009 |        "      <td>increasing</td>\n",
1010 |        "    </tr>\n",
1011 |        "    <tr>\n",
1012 |        "      <th>56</th>\n",
1013 |        "      <td>VIII</td>\n",
1014 |        "      <td>ANC_uekv/l</td>\n",
1015 |        "      <td>613</td>\n",
1016 |        "      <td>6.80294</td>\n",
1017 |        "      <td>8093</td>\n",
1018 |        "      <td>1.02505e-11</td>\n",
1019 |        "      <td>0.729263</td>\n",
1020 |        "      <td>increasing</td>\n",
1021 |        "    </tr>\n",
1022 |        "    <tr>\n",
1023 |        "      <th>57</th>\n",
1024 |        "      <td>VIII</td>\n",
1025 |        "      <td>pH</td>\n",
1026 |        "      <td>397</td>\n",
1027 |        "      <td>4.40372</td>\n",
1028 |        "      <td>8086.33</td>\n",
1029 |        "      <td>1.06412e-05</td>\n",
1030 |        "      <td>0.00923077</td>\n",
1031 |        "      <td>increasing</td>\n",
1032 |        "    </tr>\n",
1033 |        "    <tr>\n",
1034 |        "      <th>58</th>\n",
1035 |        "      <td>VIII</td>\n",
1036 |        "      <td>LAL_ug/l</td>\n",
1037 |        "      <td>289</td>\n",
1038 |        "      <td>3.2735</td>\n",
1039 |        "      <td>7740.33</td>\n",
1040 |        "      <td>0.00106224</td>\n",
1041 |        "      <td>0.0333333</td>\n",
1042 |        "      <td>increasing</td>\n",
1043 |        "    </tr>\n",
1044 |        "    <tr>\n",
1045 |        "      <th>59</th>\n",
1046 |        "      <td>VIII</td>\n",
1047 |        "      <td>TOC_mg-C/l</td>\n",
1048 |        "      <td>196</td>\n",
1049 |        "      <td>2.17042</td>\n",
1050 |        "      <td>8072</td>\n",
1051 |        "      <td>0.0299749</td>\n",
1052 |        "      <td>0.0047</td>\n",
1053 |        "      <td>increasing</td>\n",
1054 |        "    </tr>\n",
1055 |        "  </tbody>\n",
1056 |        "</table>\n",
1057 |        "</div>"
1058 |       ],
1059 |       "text/plain": [
1060 |        "   region      parameter     s          z    var_s            p        sslp  \\\n",
1061 |        "0       I    ESO4_uekv/l  -991   -11.6353  7239.67            0    -0.84127   \n",
1062 |        "1       I  ECa-Mg_uekv/l   -60  -0.693366  7240.67      0.48808  -0.0442908   \n",
1063 |        "2       I     ANC_uekv/l   705    8.27282  7241.67  2.22045e-16     1.12356   \n",
1064 |        "3       I             pH   657    7.71338     7233  1.22125e-14   0.0152632   \n",
1065 |        "4       I       LAL_ug/l    -8 -0.0826413  7174.67     0.934137           0   \n",
1066 |        "5       I     TOC_mg-C/l   387    4.54579  7210.33  5.47289e-06   0.0266667   \n",
1067 |        "6      IV    ESO4_uekv/l -1679   -14.1516  14059.7            0    -2.06651   \n",
1068 |        "7      IV  ECa-Mg_uekv/l  -711   -5.98785  14059.7  2.12634e-09   -0.511123   \n",
1069 |        "8      IV     ANC_uekv/l  1315    11.0817  14059.7            0     1.94012   \n",
1070 |        "9      IV             pH  1137     9.5867  14041.7            0   0.0217647   \n",
1071 |        "10     IV       LAL_ug/l -1066    -8.9855    14048            0    -2.66667   \n",
1072 |        "11     IV     TOC_mg-C/l   981    8.27061  14040.3  2.22045e-16   0.0918182   \n",
1073 |        "12     II    ESO4_uekv/l -2320   -16.0698  20824.7            0    -2.26966   \n",
1074 |        "13     II  ECa-Mg_uekv/l -1546   -10.7058  20826.7            0   -0.896604   \n",
1075 |        "14     II     ANC_uekv/l  1788    12.3827  20826.7            0     1.75421   \n",
1076 |        "15     II             pH  1279     8.8597  20807.7            0   0.0142857   \n",
1077 |        "16     II       LAL_ug/l -1201   -8.32044  20800.3            0          -2   \n",
1078 |        "17     II     TOC_mg-C/l  1113    7.71126    20795  1.24345e-14   0.0861481   \n",
1079 |        "18      X    ESO4_uekv/l  -720   -8.66664  6882.67            0    -1.33067   \n",
1080 |        "19      X  ECa-Mg_uekv/l    54   0.638848  6882.67     0.522922   0.0802304   \n",
1081 |        "20      X     ANC_uekv/l   700    8.42556  6882.67            0     1.92631   \n",
1082 |        "21      X             pH   693    8.34867  6870.33            0        0.02   \n",
1083 |        "22      X       LAL_ug/l    14   0.160384     6570     0.872579           0   \n",
1084 |        "23      X     TOC_mg-C/l   321    3.87459     6821  0.000106804   0.0131373   \n",
1085 |        "24      V    ESO4_uekv/l -1374   -12.6771    11730            0    -1.64888   \n",
1086 |        "25      V  ECa-Mg_uekv/l  -520   -4.79202    11730  1.65113e-06   -0.351444   \n",
1087 |        "26      V     ANC_uekv/l   978    9.02081    11730            0     1.88999   \n",
1088 |        "27      V             pH   998    9.21123  11715.3            0   0.0215686   \n",
1089 |        "28      V       LAL_ug/l  -899   -8.29575  11717.7            0    -2.83333   \n",
1090 |        "29      V     TOC_mg-C/l   950    8.77201    11704            0   0.0361111   \n",
1091 |        "30    III    ESO4_uekv/l  -671   -9.23721     5261            0   -0.862402   \n",
1092 |        "31    III  ECa-Mg_uekv/l   -87   -1.18567     5261     0.235752   -0.105936   \n",
1093 |        "32    III     ANC_uekv/l   524    7.20985     5262  5.60219e-13     1.04387   \n",
1094 |        "33    III             pH   490    6.74371     5258  1.54399e-11   0.0233333   \n",
1095 |        "34    III       LAL_ug/l  -208    -2.8669  5213.33   0.00414514   -0.140688   \n",
1096 |        "35    III     TOC_mg-C/l   324    4.45443     5258   8.4116e-06   0.0103509   \n",
1097 |        "36    VII    ESO4_uekv/l -1209   -11.5068    11021            0   -0.424367   \n",
1098 |        "37    VII  ECa-Mg_uekv/l    16   0.142877    11022     0.886388  0.00263083   \n",
1099 |        "38    VII     ANC_uekv/l   941    8.95319    11023            0    0.646314   \n",
1100 |        "39    VII             pH  1020    9.70961    11014            0   0.0188889   \n",
1101 |        "40    VII       LAL_ug/l  -588   -5.60328  10974.7  2.10331e-08   -0.333333   \n",
1102 |        "41    VII     TOC_mg-C/l    60    0.56239    11006     0.573851  0.00102564   \n",
1103 |        "42     VI    ESO4_uekv/l  -892   -9.70852  8422.67            0   -0.906736   \n",
1104 |        "43     VI  ECa-Mg_uekv/l  -150   -1.62353  8422.67     0.104475   -0.104055   \n",
1105 |        "44     VI     ANC_uekv/l   704    7.66003  8422.67  1.86517e-14     1.11682   \n",
1106 |        "45     VI             pH   730    7.94522  8418.67   1.9984e-15   0.0269048   \n",
1107 |        "46     VI       LAL_ug/l  -651   -7.09391  8395.67  1.30385e-12        -1.5   \n",
1108 |        "47     VI     TOC_mg-C/l   565    6.15533  8395.67  7.49202e-10    0.020875   \n",
1109 |        "48     IX    ESO4_uekv/l   -34  -0.996498  1096.67     0.319008  -0.0524026   \n",
1110 |        "49     IX  ECa-Mg_uekv/l    90    2.68753  1096.67   0.00719835    0.436464   \n",
1111 |        "50     IX     ANC_uekv/l    90    2.68753  1096.67   0.00719835    0.484974   \n",
1112 |        "51     IX             pH    66    1.96459  1094.67    0.0494615  0.00563492   \n",
1113 |        "52     IX       LAL_ug/l    87    2.60926  1086.33    0.0090739    0.181818   \n",
1114 |        "53     IX     TOC_mg-C/l    41    1.20843  1095.67     0.226883  0.00325397   \n",
1115 |        "54   VIII    ESO4_uekv/l  -469   -5.20439  8086.33  1.94632e-07   -0.203925   \n",
1116 |        "55   VIII  ECa-Mg_uekv/l   265     2.9346     8093   0.00333976    0.209264   \n",
1117 |        "56   VIII     ANC_uekv/l   613    6.80294     8093  1.02505e-11    0.729263   \n",
1118 |        "57   VIII             pH   397    4.40372  8086.33  1.06412e-05  0.00923077   \n",
1119 |        "58   VIII       LAL_ug/l   289     3.2735  7740.33   0.00106224   0.0333333   \n",
1120 |        "59   VIII     TOC_mg-C/l   196    2.17042     8072    0.0299749      0.0047   \n",
1121 |        "\n",
1122 |        "         trend  \n",
1123 |        "0   decreasing  \n",
1124 |        "1     no trend  \n",
1125 |        "2   increasing  \n",
1126 |        "3   increasing  \n",
1127 |        "4     no trend  \n",
1128 |        "5   increasing  \n",
1129 |        "6   decreasing  \n",
1130 |        "7   decreasing  \n",
1131 |        "8   increasing  \n",
1132 |        "9   increasing  \n",
1133 |        "10  decreasing  \n",
1134 |        "11  increasing  \n",
1135 |        "12  decreasing  \n",
1136 |        "13  decreasing  \n",
1137 |        "14  increasing  \n",
1138 |        "15  increasing  \n",
1139 |        "16  decreasing  \n",
1140 |        "17  increasing  \n",
1141 |        "18  decreasing  \n",
1142 |        "19    no trend  \n",
1143 |        "20  increasing  \n",
1144 |        "21  increasing  \n",
1145 |        "22    no trend  \n",
1146 |        "23  increasing  \n",
1147 |        "24  decreasing  \n",
1148 |        "25  decreasing  \n",
1149 |        "26  increasing  \n",
1150 |        "27  increasing  \n",
1151 |        "28  decreasing  \n",
1152 |        "29  increasing  \n",
1153 |        "30  decreasing  \n",
1154 |        "31    no trend  \n",
1155 |        "32  increasing  \n",
1156 |        "33  increasing  \n",
1157 |        "34  decreasing  \n",
1158 |        "35  increasing  \n",
1159 |        "36  decreasing  \n",
1160 |        "37    no trend  \n",
1161 |        "38  increasing  \n",
1162 |        "39  increasing  \n",
1163 |        "40  decreasing  \n",
1164 |        "41    no trend  \n",
1165 |        "42  decreasing  \n",
1166 |        "43    no trend  \n",
1167 |        "44  increasing  \n",
1168 |        "45  increasing  \n",
1169 |        "46  decreasing  \n",
1170 |        "47  increasing  \n",
1171 |        "48    no trend  \n",
1172 |        "49  increasing  \n",
1173 |        "50  increasing  \n",
1174 |        "51  increasing  \n",
1175 |        "52  increasing  \n",
1176 |        "53    no trend  \n",
1177 |        "54  decreasing  \n",
1178 |        "55  increasing  \n",
1179 |        "56  increasing  \n",
1180 |        "57  increasing  \n",
1181 |        "58  increasing  \n",
1182 |        "59  increasing  "
1183 |       ]
1184 |      },
1185 |      "execution_count": 5,
1186 |      "metadata": {},
1187 |      "output_type": "execute_result"
1188 |     }
1189 |    ],
1190 |    "source": [
1191 |     "# Pars to plot\n",
1192 |     "pars = [\"ESO4_uekv/l\", \"ECa-Mg_uekv/l\", \"ANC_uekv/l\", \"pH\", \"LAL_ug/l\", \"TOC_mg-C/l\"]\n",
1193 |     "\n",
1194 |     "res_list = []\n",
1195 |     "\n",
1196 |     "# Loop over regions\n",
1197 |     "for reg in agg[\"region\"].unique():\n",
1198 |     "    reg_df = agg.query(\"region == @reg\")\n",
1199 |     "\n",
1200 |     "    # Loop over pars\n",
1201 |     "    for par in pars:\n",
1202 |     "        res_df = nivapy.stats.seasonal_regional_mk_sen(\n",
1203 |     "            reg_df, time_col=\"year\", value_col=par, block_col=\"station_name\"\n",
1204 |     "        ).T.loc['value']\n",
1205 |     "        res_df['region'] = reg\n",
1206 |     "        res_df['parameter'] = par\n",
1207 |     "        res_list.append(res_df)\n",
1208 |     "\n",
1209 |     "res_df = pd.concat(res_list, axis=1, sort=False).T.reset_index(drop=True)\n",
1210 |     "res_df = res_df[['region', 'parameter', 's', 'z', 'var_s', 'p', 'sslp', 'trend']]\n",
1211 |     "res_df.to_csv('regional_mk_trends.csv', index=False)\n",
1212 |     "\n",
1213 |     "res_df"
1214 |    ]
1215 |   }
1216 |  ],
1217 |  "metadata": {
1218 |   "kernelspec": {
1219 |    "display_name": "Python 3",
1220 |    "language": "python",
1221 |    "name": "python3"
1222 |   },
1223 |   "language_info": {
1224 |    "codemirror_mode": {
1225 |     "name": "ipython",
1226 |     "version": 3
1227 |    },
1228 |    "file_extension": ".py",
1229 |    "mimetype": "text/x-python",
1230 |    "name": "python",
1231 |    "nbconvert_exporter": "python",
1232 |    "pygments_lexer": "ipython3",
1233 |    "version": "3.7.6"
1234 |   }
1235 |  },
1236 |  "nbformat": 4,
1237 |  "nbformat_minor": 4
1238 | }
1239 | 


--------------------------------------------------------------------------------
/notebooks/update_db_2018_report.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "code",
   5 |    "execution_count": 1,
   6 |    "metadata": {},
   7 |    "outputs": [],
   8 |    "source": [
   9 |     "%matplotlib inline\n",
  10 |     "\n",
  11 |     "import pandas as pd\n",
  12 |     "import nivapy3 as nivapy\n",
  13 |     "import matplotlib.pyplot as plt\n",
  14 |     "import datetime as dt\n",
  15 |     "import numpy as np\n",
  16 |     "from sqlalchemy import text\n",
  17 |     "\n",
  18 |     "plt.style.use('ggplot')"
  19 |    ]
  20 |   },
  21 |   {
  22 |    "cell_type": "code",
  23 |    "execution_count": 6,
  24 |    "metadata": {},
  25 |    "outputs": [
  26 |     {
  27 |      "name": "stdin",
  28 |      "output_type": "stream",
  29 |      "text": [
  30 |       "Username:  ···\n",
  31 |       "Password:  ········\n"
  32 |      ]
  33 |     },
  34 |     {
  35 |      "name": "stdout",
  36 |      "output_type": "stream",
  37 |      "text": [
  38 |       "Connection successful.\n"
  39 |      ]
  40 |     }
  41 |    ],
  42 |    "source": [
  43 |     "# Connect to Oracle\n",
  44 |     "eng = nivapy.da.connect()"
  45 |    ]
  46 |   },
  47 |   {
  48 |    "cell_type": "markdown",
  49 |    "metadata": {},
  50 |    "source": [
  51 |     "# Biolok: updates for the 2018 report\n",
  52 |     "\n",
  53 |     "This notebook describes data processing and RESA2 updates for the 2018 Biolok report. Data sources are as follows:\n",
  54 |     "\n",
  55 |     " * All data prior to 2015 are stored in RESA2 as a **dataset** named `BIOLOK rapp2015` (project ID 4030). This dataset comprises 43 stations, but only a subset of water samples from each site are included. Relevant data can be exported via the RESA2 application, but it is important to **remember to check the box** labelled *Use only water samples from selected projects*, otherwise all samples will be returned. Within the RESA2 database, relevant samples are associated with `SAMPLE_SELECTION_ID` 62 in the `RESA2.SAMPLE_SELECTIONS` table\n",
  56 |     " \n",
  57 |     " * From 2015 onwards, the project comprises 42 stations (two have been removed from the original project and one added). Most of the data are stored in both RESA2 and Aquamonitor, but we also receive data from an external laboratory named Faun. Liv Bente has compiled a spreadsheet here\n",
  58 |     " \n",
  59 |     "         K:\\Prosjekter\\langtransporterte forurensninger\\O-190033-7 BIOLOK_rapp 2014-18\\Samlede prøver ulike kilder_til RESA_JES_nov19.xlsx\n",
  60 |     "         \n",
  61 |     "   listing relevant samples since 2015\n",
  62 |     "   \n",
  63 |     "The general workflow is as follows:\n",
  64 |     "\n",
  65 |     " 1. Create a new dataset for the 2018 report in the `RESA2.PROJECTS` table\n",
  66 |     " \n",
  67 |     " 2. Add the 42 stations in the current project to `PROJECTS_STATIONS`\n",
  68 |     " \n",
  69 |     " 3. Create a new `SAMPLE_SELECTION_ID` in `RESA2.SAMPLE_SELECTION_DEFINITIONS`\n",
  70 |     " \n",
  71 |     " 4. Update the new sample selection in `RESA2.SAMPLE_SELECTIONS` to include pre-2015 water samples from the 41 \"common\" stations\n",
  72 |     " \n",
  73 |     " 5. Check whether all non-Faun samples are already present in RESA, or whether some data need to be transferred from AM\n",
  74 |     " \n",
  75 |     " 6. Update the new sample selection to include relevant samples from 2015 onwards for the 41 common sites (based on Liv Bente's spreadsheet)\n",
  76 |     " \n",
  77 |     " 7. Also add relevant samples from all years for Stakksheitjørna, which is the new station added to the project since 2014 (based on Liv Bente's spreadsheet)\n",
  78 |     " \n",
  79 |     " 8. Add data from Faun to RESA and link to the sample selection (based on Liv Bente's spreadsheet)"
  80 |    ]
  81 |   },
  82 |   {
  83 |    "cell_type": "markdown",
  84 |    "metadata": {},
  85 |    "source": [
  86 |     "## 1. Create dataset\n",
  87 |     "\n",
  88 |     "There is no real distinction between \"projects\" and \"datasets\" in RESA: both are stored in the `PROJECTS` table. The column named `PROJECT_OR_DATASET` in this table can be used to determine which table the project/dataset is shown in on the *Select project* window of the RESA2 application.\n",
  89 |     "\n",
  90 |     "**The new project created below has `PROJECT_ID` 4490**."
  91 |    ]
  92 |   },
  93 |   {
  94 |    "cell_type": "code",
  95 |    "execution_count": 3,
  96 |    "metadata": {},
  97 |    "outputs": [],
  98 |    "source": [
  99 |     "## Create a new dataset\n",
 100 |     "#sql = (\"INSERT INTO resa2.projects \"\n",
 101 |     "#       \"  (project_name, contact_person, project_or_dataset, \"\n",
 102 |     "#       \"   contact_person_initials, project_description) \"\n",
 103 |     "#       \"VALUES \"\n",
 104 |     "#       \"  ('BIOLOK rapp2018', 'Liv Bente Skancke', 'Dataset', \"\n",
 105 |     "#       \"   'LBS', 'Stations included in the Biolok report (data up to 2018; written during 2020)')\"\n",
 106 |     "#      )\n",
 107 |     "#eng.execute(sql)"
 108 |    ]
 109 |   },
 110 |   {
 111 |    "cell_type": "markdown",
 112 |    "metadata": {},
 113 |    "source": [
 114 |     "## 2. Add stations\n",
 115 |     "\n",
 116 |     "The stations involved in the project since 2015 are listed in the `stations` worksheet of `../project_overview_from_lbs.xlsx`."
 117 |    ]
 118 |   },
 119 |   {
 120 |    "cell_type": "code",
 121 |    "execution_count": 4,
 122 |    "metadata": {},
 123 |    "outputs": [
 124 |     {
 125 |      "data": {
 126 |       "text/html": [
 127 |        "<div>\n",
 128 |        "<style scoped>\n",
 129 |        "    .dataframe tbody tr th:only-of-type {\n",
 130 |        "        vertical-align: middle;\n",
 131 |        "    }\n",
 132 |        "\n",
 133 |        "    .dataframe tbody tr th {\n",
 134 |        "        vertical-align: top;\n",
 135 |        "    }\n",
 136 |        "\n",
 137 |        "    .dataframe thead th {\n",
 138 |        "        text-align: right;\n",
 139 |        "    }\n",
 140 |        "</style>\n",
 141 |        "<table border=\"1\" class=\"dataframe\">\n",
 142 |        "  <thead>\n",
 143 |        "    <tr style=\"text-align: right;\">\n",
 144 |        "      <th></th>\n",
 145 |        "      <th>station_id</th>\n",
 146 |        "      <th>station_code</th>\n",
 147 |        "      <th>station_name</th>\n",
 148 |        "      <th>region</th>\n",
 149 |        "      <th>biolok_code</th>\n",
 150 |        "      <th>nve_vatn_nr</th>\n",
 151 |        "      <th>elevation_m</th>\n",
 152 |        "      <th>fylke</th>\n",
 153 |        "      <th>kommune</th>\n",
 154 |        "    </tr>\n",
 155 |        "  </thead>\n",
 156 |        "  <tbody>\n",
 157 |        "    <tr>\n",
 158 |        "      <th>0</th>\n",
 159 |        "      <td>42</td>\n",
 160 |        "      <td>1003-2-4</td>\n",
 161 |        "      <td>Saudlandsvatnet</td>\n",
 162 |        "      <td>5</td>\n",
 163 |        "      <td>V-1</td>\n",
 164 |        "      <td>21894</td>\n",
 165 |        "      <td>106.0</td>\n",
 166 |        "      <td>Vest-Agder</td>\n",
 167 |        "      <td>Farsund kommune</td>\n",
 168 |        "    </tr>\n",
 169 |        "    <tr>\n",
 170 |        "      <th>1</th>\n",
 171 |        "      <td>192</td>\n",
 172 |        "      <td>1014-12</td>\n",
 173 |        "      <td>Sognevatn</td>\n",
 174 |        "      <td>4</td>\n",
 175 |        "      <td>IV-9</td>\n",
 176 |        "      <td>11078</td>\n",
 177 |        "      <td>267.0</td>\n",
 178 |        "      <td>Vest-Agder</td>\n",
 179 |        "      <td>Vennesla kommune</td>\n",
 180 |        "    </tr>\n",
 181 |        "    <tr>\n",
 182 |        "      <th>2</th>\n",
 183 |        "      <td>182</td>\n",
 184 |        "      <td>1014-25</td>\n",
 185 |        "      <td>Drivenesvatn</td>\n",
 186 |        "      <td>4</td>\n",
 187 |        "      <td>IV-8</td>\n",
 188 |        "      <td>11147</td>\n",
 189 |        "      <td>176.0</td>\n",
 190 |        "      <td>Vest-Agder</td>\n",
 191 |        "      <td>Vennesla kommune</td>\n",
 192 |        "    </tr>\n",
 193 |        "    <tr>\n",
 194 |        "      <th>3</th>\n",
 195 |        "      <td>166</td>\n",
 196 |        "      <td>1018-4</td>\n",
 197 |        "      <td>Kleivsetvannet</td>\n",
 198 |        "      <td>4</td>\n",
 199 |        "      <td>IV-10</td>\n",
 200 |        "      <td>11592</td>\n",
 201 |        "      <td>93.0</td>\n",
 202 |        "      <td>Vest-Agder</td>\n",
 203 |        "      <td>Søgne kommune</td>\n",
 204 |        "    </tr>\n",
 205 |        "    <tr>\n",
 206 |        "      <th>4</th>\n",
 207 |        "      <td>118</td>\n",
 208 |        "      <td>1034-19</td>\n",
 209 |        "      <td>Indre Espelandsvatnet</td>\n",
 210 |        "      <td>5</td>\n",
 211 |        "      <td>V-2</td>\n",
 212 |        "      <td>11095</td>\n",
 213 |        "      <td>389.0</td>\n",
 214 |        "      <td>Vest-Agder</td>\n",
 215 |        "      <td>Hægebostad kommune</td>\n",
 216 |        "    </tr>\n",
 217 |        "  </tbody>\n",
 218 |        "</table>\n",
 219 |        "</div>"
 220 |       ],
 221 |       "text/plain": [
 222 |        "   station_id station_code           station_name  region biolok_code  \\\n",
 223 |        "0          42     1003-2-4        Saudlandsvatnet       5         V-1   \n",
 224 |        "1         192      1014-12              Sognevatn       4        IV-9   \n",
 225 |        "2         182      1014-25           Drivenesvatn       4        IV-8   \n",
 226 |        "3         166       1018-4         Kleivsetvannet       4       IV-10   \n",
 227 |        "4         118      1034-19  Indre Espelandsvatnet       5         V-2   \n",
 228 |        "\n",
 229 |        "   nve_vatn_nr  elevation_m       fylke             kommune  \n",
 230 |        "0        21894        106.0  Vest-Agder     Farsund kommune  \n",
 231 |        "1        11078        267.0  Vest-Agder    Vennesla kommune  \n",
 232 |        "2        11147        176.0  Vest-Agder    Vennesla kommune  \n",
 233 |        "3        11592         93.0  Vest-Agder       Søgne kommune  \n",
 234 |        "4        11095        389.0  Vest-Agder  Hægebostad kommune  "
 235 |       ]
 236 |      },
 237 |      "execution_count": 4,
 238 |      "metadata": {},
 239 |      "output_type": "execute_result"
 240 |     }
 241 |    ],
 242 |    "source": [
 243 |     "# Read stations\n",
 244 |     "stn_df = pd.read_excel('../project_overview_from_lbs.xlsx',\n",
 245 |     "                       sheet_name='stations')\n",
 246 |     "stn_df.head()"
 247 |    ]
 248 |   },
 249 |   {
 250 |    "cell_type": "code",
 251 |    "execution_count": 5,
 252 |    "metadata": {},
 253 |    "outputs": [],
 254 |    "source": [
 255 |     "## Reformat for adding to database\n",
 256 |     "#stn_df2 = stn_df.copy()\n",
 257 |     "#stn_df2['project_id'] = 4490\n",
 258 |     "#stn_df2['active'] = 'Y'\n",
 259 |     "#stn_df2 = stn_df2[['station_id', 'project_id', 'active', 'biolok_code']]\n",
 260 |     "#stn_df2.rename({'biolok_code':'station_code'}, axis=1, inplace=True)\n",
 261 |     "#\n",
 262 |     "## Write to db\n",
 263 |     "#stn_df2.to_sql('projects_stations', \n",
 264 |     "#               eng, \n",
 265 |     "#               schema='RESA2', \n",
 266 |     "#               if_exists='append', \n",
 267 |     "#               index=False,\n",
 268 |     "#              )"
 269 |    ]
 270 |   },
 271 |   {
 272 |    "cell_type": "markdown",
 273 |    "metadata": {},
 274 |    "source": [
 275 |     "## 3. Create a new sample selection"
 276 |    ]
 277 |   },
 278 |   {
 279 |    "cell_type": "code",
 280 |    "execution_count": 6,
 281 |    "metadata": {},
 282 |    "outputs": [],
 283 |    "source": [
 284 |     "## Create sample selection\n",
 285 |     "#sql = (\"INSERT INTO resa2.sample_selection_definitions \"\n",
 286 |     "#       \"  (sample_selection_id, project_id, name) \"\n",
 287 |     "#       \"VALUES \"\n",
 288 |     "#       \"  (66, 4490, 'Biolok (start to 2018)')\"\n",
 289 |     "#      )\n",
 290 |     "#eng.execute(sql)"
 291 |    ]
 292 |   },
 293 |   {
 294 |    "cell_type": "markdown",
 295 |    "metadata": {},
 296 |    "source": [
 297 |     "## 4. Add pre-2015 water samples\n",
 298 |     "\n",
 299 |     "The code below first queries all water samples associated with the 2015 report, which includes two stations that are no longer part of the project. Next, the code queries *all* water samples in the database associated with the 42 stations that *are* in the current project, and then calculates the intersection of these two sets. This produces a list of pre-2015 samples to be transferred.\n",
 300 |     "\n",
 301 |     "The pre-2015 samples are associated with `SAMPLE_SELECTION_ID` 62."
 302 |    ]
 303 |   },
 304 |   {
 305 |    "cell_type": "code",
 306 |    "execution_count": 7,
 307 |    "metadata": {},
 308 |    "outputs": [
 309 |     {
 310 |      "name": "stdout",
 311 |      "output_type": "stream",
 312 |      "text": [
 313 |       "1566\n"
 314 |      ]
 315 |     },
 316 |     {
 317 |      "data": {
 318 |       "text/html": [
 319 |        "<div>\n",
 320 |        "<style scoped>\n",
 321 |        "    .dataframe tbody tr th:only-of-type {\n",
 322 |        "        vertical-align: middle;\n",
 323 |        "    }\n",
 324 |        "\n",
 325 |        "    .dataframe tbody tr th {\n",
 326 |        "        vertical-align: top;\n",
 327 |        "    }\n",
 328 |        "\n",
 329 |        "    .dataframe thead th {\n",
 330 |        "        text-align: right;\n",
 331 |        "    }\n",
 332 |        "</style>\n",
 333 |        "<table border=\"1\" class=\"dataframe\">\n",
 334 |        "  <thead>\n",
 335 |        "    <tr style=\"text-align: right;\">\n",
 336 |        "      <th></th>\n",
 337 |        "      <th>water_sample_id</th>\n",
 338 |        "      <th>sample_selection_id</th>\n",
 339 |        "    </tr>\n",
 340 |        "  </thead>\n",
 341 |        "  <tbody>\n",
 342 |        "    <tr>\n",
 343 |        "      <th>0</th>\n",
 344 |        "      <td>273550</td>\n",
 345 |        "      <td>66</td>\n",
 346 |        "    </tr>\n",
 347 |        "    <tr>\n",
 348 |        "      <th>1</th>\n",
 349 |        "      <td>273552</td>\n",
 350 |        "      <td>66</td>\n",
 351 |        "    </tr>\n",
 352 |        "    <tr>\n",
 353 |        "      <th>2</th>\n",
 354 |        "      <td>532542</td>\n",
 355 |        "      <td>66</td>\n",
 356 |        "    </tr>\n",
 357 |        "    <tr>\n",
 358 |        "      <th>3</th>\n",
 359 |        "      <td>532544</td>\n",
 360 |        "      <td>66</td>\n",
 361 |        "    </tr>\n",
 362 |        "    <tr>\n",
 363 |        "      <th>4</th>\n",
 364 |        "      <td>532545</td>\n",
 365 |        "      <td>66</td>\n",
 366 |        "    </tr>\n",
 367 |        "  </tbody>\n",
 368 |        "</table>\n",
 369 |        "</div>"
 370 |       ],
 371 |       "text/plain": [
 372 |        "   water_sample_id  sample_selection_id\n",
 373 |        "0           273550                   66\n",
 374 |        "1           273552                   66\n",
 375 |        "2           532542                   66\n",
 376 |        "3           532544                   66\n",
 377 |        "4           532545                   66"
 378 |       ]
 379 |      },
 380 |      "execution_count": 7,
 381 |      "metadata": {},
 382 |      "output_type": "execute_result"
 383 |     }
 384 |    ],
 385 |    "source": [
 386 |     "# Get WS IDs for pre-2015 stations\n",
 387 |     "sql = (\"SELECT water_sample_id FROM resa2.sample_selections \"\n",
 388 |     "       \"WHERE sample_selection_id = 62\")\n",
 389 |     "pre2015_df = pd.read_sql(sql, eng)\n",
 390 |     "\n",
 391 |     "# Get all WS in db for stations in 2018 project\n",
 392 |     "bind_pars = ','.join('%d' % i for i in stn_df['station_id'])\n",
 393 |     "sql = (\"SELECT water_sample_id FROM resa2.water_samples \"\n",
 394 |     "       \"WHERE station_id IN (%s)\" % bind_pars)\n",
 395 |     "all_df = pd.read_sql(sql, eng)\n",
 396 |     "\n",
 397 |     "# Compute intersection\n",
 398 |     "ws_ids = list(set(pre2015_df['water_sample_id']).intersection(set(all_df['water_sample_id'])))\n",
 399 |     "\n",
 400 |     "# Build df\n",
 401 |     "ws_df = pd.DataFrame({'water_sample_id':ws_ids})\n",
 402 |     "ws_df['sample_selection_id'] = 66\n",
 403 |     "print(len(ws_df))\n",
 404 |     "\n",
 405 |     "ws_df.head()"
 406 |    ]
 407 |   },
 408 |   {
 409 |    "cell_type": "code",
 410 |    "execution_count": 8,
 411 |    "metadata": {},
 412 |    "outputs": [],
 413 |    "source": [
 414 |     "## Write to db\n",
 415 |     "#ws_df.to_sql('sample_selections', \n",
 416 |     "#             eng, \n",
 417 |     "#             schema='RESA2', \n",
 418 |     "#             if_exists='append', \n",
 419 |     "#             index=False,\n",
 420 |     "#            )"
 421 |    ]
 422 |   },
 423 |   {
 424 |    "cell_type": "markdown",
 425 |    "metadata": {},
 426 |    "source": [
 427 |     "## 5. Check whether all non-Faun data are already in RESA\n",
 428 |     "\n",
 429 |     "Liv Bente's Excel file here\n",
 430 |     "\n",
 431 |     "    K:\\Prosjekter\\langtransporterte forurensninger\\O-190033-7 BIOLOK_rapp 2014-18\\Samlede prøver ulike kilder_til RESA_JES_nov19.xlsx\n",
 432 |     "    \n",
 433 |     "includes a worksheet named `Data fra AquaM`, which lists water chemistry data that should be taken from AM. However, it looks as though most of these samples are already available in RESA. I've created a tidied version of Liv Bente's AM samples list in the `lbs_am_samples` worksheet of `../project_overview_from_lbs.xlsx`. The code below loops over these to see whether they can be identified in RESA instead.\n",
 434 |     "\n",
 435 |     "**Note:** Initially, around 30 water samples could not be identified. Most of these were due to missing links in the `NIVADATABASE.DATASOURCE_STATION` table, which I have now added. In addition:\n",
 436 |     "\n",
 437 |     " * AM station 26199 (Storbørja) was incorrectly linked to RESA ID 3042 (Svartbørja)\n",
 438 |     " \n",
 439 |     " * One sample from Rondvatnet (AM ID 49204; RESA ID 12712) had the date incorrectly assigned in RESA: the date was given as 13.07.2017 in AM, but 13.06.2017 in RESA. I will assume the AM date is correct\n",
 440 |     " \n",
 441 |     "Having corrected the above issues, all samples in Liv Bente's `Data fra AquaM` worksheet can now be identified in RESA."
 442 |    ]
 443 |   },
 444 |   {
 445 |    "cell_type": "code",
 446 |    "execution_count": 9,
 447 |    "metadata": {},
 448 |    "outputs": [
 449 |     {
 450 |      "data": {
 451 |       "text/html": [
 452 |        "<div>\n",
 453 |        "<style scoped>\n",
 454 |        "    .dataframe tbody tr th:only-of-type {\n",
 455 |        "        vertical-align: middle;\n",
 456 |        "    }\n",
 457 |        "\n",
 458 |        "    .dataframe tbody tr th {\n",
 459 |        "        vertical-align: top;\n",
 460 |        "    }\n",
 461 |        "\n",
 462 |        "    .dataframe thead th {\n",
 463 |        "        text-align: right;\n",
 464 |        "    }\n",
 465 |        "</style>\n",
 466 |        "<table border=\"1\" class=\"dataframe\">\n",
 467 |        "  <thead>\n",
 468 |        "    <tr style=\"text-align: right;\">\n",
 469 |        "      <th></th>\n",
 470 |        "      <th>am_id</th>\n",
 471 |        "      <th>resa_code</th>\n",
 472 |        "      <th>am_name</th>\n",
 473 |        "      <th>resa_name</th>\n",
 474 |        "      <th>date</th>\n",
 475 |        "      <th>depth1</th>\n",
 476 |        "      <th>depth2</th>\n",
 477 |        "    </tr>\n",
 478 |        "  </thead>\n",
 479 |        "  <tbody>\n",
 480 |        "    <tr>\n",
 481 |        "      <th>0</th>\n",
 482 |        "      <td>8614</td>\n",
 483 |        "      <td>430-I-1</td>\n",
 484 |        "      <td>Atnsjøen</td>\n",
 485 |        "      <td>Atnsjøen</td>\n",
 486 |        "      <td>2018-06-10 00:00:00</td>\n",
 487 |        "      <td>0.5</td>\n",
 488 |        "      <td>0.5</td>\n",
 489 |        "    </tr>\n",
 490 |        "    <tr>\n",
 491 |        "      <th>1</th>\n",
 492 |        "      <td>8614</td>\n",
 493 |        "      <td>430-I-1</td>\n",
 494 |        "      <td>Atnsjøen</td>\n",
 495 |        "      <td>Atnsjøen</td>\n",
 496 |        "      <td>2018-08-09 00:00:00</td>\n",
 497 |        "      <td>0.5</td>\n",
 498 |        "      <td>0.5</td>\n",
 499 |        "    </tr>\n",
 500 |        "    <tr>\n",
 501 |        "      <th>2</th>\n",
 502 |        "      <td>8614</td>\n",
 503 |        "      <td>430-I-1</td>\n",
 504 |        "      <td>Atnsjøen</td>\n",
 505 |        "      <td>Atnsjøen</td>\n",
 506 |        "      <td>2018-09-04 00:00:00</td>\n",
 507 |        "      <td>0.5</td>\n",
 508 |        "      <td>0.5</td>\n",
 509 |        "    </tr>\n",
 510 |        "    <tr>\n",
 511 |        "      <th>3</th>\n",
 512 |        "      <td>26075</td>\n",
 513 |        "      <td>432-1-26</td>\n",
 514 |        "      <td>Måsåbutjønna</td>\n",
 515 |        "      <td>Måsabutjørna</td>\n",
 516 |        "      <td>2018-06-14 13:00:00</td>\n",
 517 |        "      <td>0.5</td>\n",
 518 |        "      <td>0.5</td>\n",
 519 |        "    </tr>\n",
 520 |        "    <tr>\n",
 521 |        "      <th>4</th>\n",
 522 |        "      <td>26075</td>\n",
 523 |        "      <td>432-1-26</td>\n",
 524 |        "      <td>Måsåbutjønna</td>\n",
 525 |        "      <td>Måsabutjørna</td>\n",
 526 |        "      <td>2018-08-28 00:00:00</td>\n",
 527 |        "      <td>0.5</td>\n",
 528 |        "      <td>0.5</td>\n",
 529 |        "    </tr>\n",
 530 |        "  </tbody>\n",
 531 |        "</table>\n",
 532 |        "</div>"
 533 |       ],
 534 |       "text/plain": [
 535 |        "   am_id resa_code       am_name     resa_name                date  depth1  \\\n",
 536 |        "0   8614   430-I-1      Atnsjøen      Atnsjøen 2018-06-10 00:00:00     0.5   \n",
 537 |        "1   8614   430-I-1      Atnsjøen      Atnsjøen 2018-08-09 00:00:00     0.5   \n",
 538 |        "2   8614   430-I-1      Atnsjøen      Atnsjøen 2018-09-04 00:00:00     0.5   \n",
 539 |        "3  26075  432-1-26  Måsåbutjønna  Måsabutjørna 2018-06-14 13:00:00     0.5   \n",
 540 |        "4  26075  432-1-26  Måsåbutjønna  Måsabutjørna 2018-08-28 00:00:00     0.5   \n",
 541 |        "\n",
 542 |        "   depth2  \n",
 543 |        "0     0.5  \n",
 544 |        "1     0.5  \n",
 545 |        "2     0.5  \n",
 546 |        "3     0.5  \n",
 547 |        "4     0.5  "
 548 |       ]
 549 |      },
 550 |      "execution_count": 9,
 551 |      "metadata": {},
 552 |      "output_type": "execute_result"
 553 |     }
 554 |    ],
 555 |    "source": [
 556 |     "# Read list of AM samples\n",
 557 |     "am_ws = pd.read_excel('../project_overview_from_lbs.xlsx',\n",
 558 |     "                      sheet_name='lbs_am_samples')\n",
 559 |     "am_ws.head()"
 560 |    ]
 561 |   },
 562 |   {
 563 |    "cell_type": "code",
 564 |    "execution_count": 10,
 565 |    "metadata": {},
 566 |    "outputs": [
 567 |     {
 568 |      "data": {
 569 |       "text/html": [
 570 |        "<div>\n",
 571 |        "<style scoped>\n",
 572 |        "    .dataframe tbody tr th:only-of-type {\n",
 573 |        "        vertical-align: middle;\n",
 574 |        "    }\n",
 575 |        "\n",
 576 |        "    .dataframe tbody tr th {\n",
 577 |        "        vertical-align: top;\n",
 578 |        "    }\n",
 579 |        "\n",
 580 |        "    .dataframe thead th {\n",
 581 |        "        text-align: right;\n",
 582 |        "    }\n",
 583 |        "</style>\n",
 584 |        "<table border=\"1\" class=\"dataframe\">\n",
 585 |        "  <thead>\n",
 586 |        "    <tr style=\"text-align: right;\">\n",
 587 |        "      <th></th>\n",
 588 |        "      <th>am_id</th>\n",
 589 |        "      <th>resa_code</th>\n",
 590 |        "      <th>am_name</th>\n",
 591 |        "      <th>resa_name</th>\n",
 592 |        "      <th>date</th>\n",
 593 |        "      <th>depth1</th>\n",
 594 |        "      <th>depth2</th>\n",
 595 |        "      <th>resa_ws_id</th>\n",
 596 |        "    </tr>\n",
 597 |        "  </thead>\n",
 598 |        "  <tbody>\n",
 599 |        "    <tr>\n",
 600 |        "      <th>0</th>\n",
 601 |        "      <td>8614</td>\n",
 602 |        "      <td>430-I-1</td>\n",
 603 |        "      <td>Atnsjøen</td>\n",
 604 |        "      <td>Atnsjøen</td>\n",
 605 |        "      <td>2018-06-10 00:00:00</td>\n",
 606 |        "      <td>0.5</td>\n",
 607 |        "      <td>0.5</td>\n",
 608 |        "      <td>661404</td>\n",
 609 |        "    </tr>\n",
 610 |        "    <tr>\n",
 611 |        "      <th>1</th>\n",
 612 |        "      <td>8614</td>\n",
 613 |        "      <td>430-I-1</td>\n",
 614 |        "      <td>Atnsjøen</td>\n",
 615 |        "      <td>Atnsjøen</td>\n",
 616 |        "      <td>2018-08-09 00:00:00</td>\n",
 617 |        "      <td>0.5</td>\n",
 618 |        "      <td>0.5</td>\n",
 619 |        "      <td>661558</td>\n",
 620 |        "    </tr>\n",
 621 |        "    <tr>\n",
 622 |        "      <th>2</th>\n",
 623 |        "      <td>8614</td>\n",
 624 |        "      <td>430-I-1</td>\n",
 625 |        "      <td>Atnsjøen</td>\n",
 626 |        "      <td>Atnsjøen</td>\n",
 627 |        "      <td>2018-09-04 00:00:00</td>\n",
 628 |        "      <td>0.5</td>\n",
 629 |        "      <td>0.5</td>\n",
 630 |        "      <td>661844</td>\n",
 631 |        "    </tr>\n",
 632 |        "    <tr>\n",
 633 |        "      <th>3</th>\n",
 634 |        "      <td>26075</td>\n",
 635 |        "      <td>432-1-26</td>\n",
 636 |        "      <td>Måsåbutjønna</td>\n",
 637 |        "      <td>Måsabutjørna</td>\n",
 638 |        "      <td>2018-06-14 13:00:00</td>\n",
 639 |        "      <td>0.5</td>\n",
 640 |        "      <td>0.5</td>\n",
 641 |        "      <td>661408</td>\n",
 642 |        "    </tr>\n",
 643 |        "    <tr>\n",
 644 |        "      <th>4</th>\n",
 645 |        "      <td>26075</td>\n",
 646 |        "      <td>432-1-26</td>\n",
 647 |        "      <td>Måsåbutjønna</td>\n",
 648 |        "      <td>Måsabutjørna</td>\n",
 649 |        "      <td>2018-08-28 00:00:00</td>\n",
 650 |        "      <td>0.5</td>\n",
 651 |        "      <td>0.5</td>\n",
 652 |        "      <td>661679</td>\n",
 653 |        "    </tr>\n",
 654 |        "  </tbody>\n",
 655 |        "</table>\n",
 656 |        "</div>"
 657 |       ],
 658 |       "text/plain": [
 659 |        "   am_id resa_code       am_name     resa_name                date  depth1  \\\n",
 660 |        "0   8614   430-I-1      Atnsjøen      Atnsjøen 2018-06-10 00:00:00     0.5   \n",
 661 |        "1   8614   430-I-1      Atnsjøen      Atnsjøen 2018-08-09 00:00:00     0.5   \n",
 662 |        "2   8614   430-I-1      Atnsjøen      Atnsjøen 2018-09-04 00:00:00     0.5   \n",
 663 |        "3  26075  432-1-26  Måsåbutjønna  Måsabutjørna 2018-06-14 13:00:00     0.5   \n",
 664 |        "4  26075  432-1-26  Måsåbutjønna  Måsabutjørna 2018-08-28 00:00:00     0.5   \n",
 665 |        "\n",
 666 |        "   depth2  resa_ws_id  \n",
 667 |        "0     0.5      661404  \n",
 668 |        "1     0.5      661558  \n",
 669 |        "2     0.5      661844  \n",
 670 |        "3     0.5      661408  \n",
 671 |        "4     0.5      661679  "
 672 |       ]
 673 |      },
 674 |      "execution_count": 10,
 675 |      "metadata": {},
 676 |      "output_type": "execute_result"
 677 |     }
 678 |    ],
 679 |    "source": [
 680 |     "# Loop over data\n",
 681 |     "ws_list = []\n",
 682 |     "for idx, row in am_ws.iterrows():\n",
 683 |     "    # Get station ID\n",
 684 |     "    stn_code = row['resa_code']\n",
 685 |     "    stn_id = stn_df.query('station_code == @stn_code')['station_id'].iloc[0]\n",
 686 |     "    \n",
 687 |     "    # Query RESA db\n",
 688 |     "    par_dict = {'stn_id':stn_id.item(),\n",
 689 |     "                'sample_date':  row['date'].date(),\n",
 690 |     "                'depth1':row['depth1'],\n",
 691 |     "                'depth2':row['depth2'],\n",
 692 |     "               }\n",
 693 |     "    \n",
 694 |     "    sql = (\"SELECT * FROM resa2.water_samples \"\n",
 695 |     "           \"WHERE station_id = :stn_id \"\n",
 696 |     "           \"AND TRUNC(sample_date) = :sample_date \"\n",
 697 |     "           \"AND depth1 = :depth1 \"\n",
 698 |     "           \"AND depth2 = :depth2\")\n",
 699 |     "    \n",
 700 |     "    res = pd.read_sql(sql, con=eng, params=par_dict)\n",
 701 |     "    \n",
 702 |     "    if len(res) == 1:\n",
 703 |     "        ws_list.append(res['water_sample_id'].iloc[0])\n",
 704 |     "    elif len(res) == 0:\n",
 705 |     "        ws_list.append(np.nan)\n",
 706 |     "    else:\n",
 707 |     "        print(stn_code, row['date'].date(), len(res))\n",
 708 |     "        ws_list.append(-1)\n",
 709 |     "\n",
 710 |     "am_ws['resa_ws_id'] = ws_list\n",
 711 |     "am_ws.head()"
 712 |    ]
 713 |   },
 714 |   {
 715 |    "cell_type": "code",
 716 |    "execution_count": 11,
 717 |    "metadata": {},
 718 |    "outputs": [
 719 |     {
 720 |      "data": {
 721 |       "text/plain": [
 722 |        "am_id         85\n",
 723 |        "resa_code     85\n",
 724 |        "am_name       85\n",
 725 |        "resa_name     85\n",
 726 |        "date          85\n",
 727 |        "depth1        85\n",
 728 |        "depth2        85\n",
 729 |        "resa_ws_id    85\n",
 730 |        "dtype: int64"
 731 |       ]
 732 |      },
 733 |      "execution_count": 11,
 734 |      "metadata": {},
 735 |      "output_type": "execute_result"
 736 |     }
 737 |    ],
 738 |    "source": [
 739 |     "am_ws.count()"
 740 |    ]
 741 |   },
 742 |   {
 743 |    "cell_type": "code",
 744 |    "execution_count": 12,
 745 |    "metadata": {},
 746 |    "outputs": [
 747 |     {
 748 |      "data": {
 749 |       "text/html": [
 750 |        "<div>\n",
 751 |        "<style scoped>\n",
 752 |        "    .dataframe tbody tr th:only-of-type {\n",
 753 |        "        vertical-align: middle;\n",
 754 |        "    }\n",
 755 |        "\n",
 756 |        "    .dataframe tbody tr th {\n",
 757 |        "        vertical-align: top;\n",
 758 |        "    }\n",
 759 |        "\n",
 760 |        "    .dataframe thead th {\n",
 761 |        "        text-align: right;\n",
 762 |        "    }\n",
 763 |        "</style>\n",
 764 |        "<table border=\"1\" class=\"dataframe\">\n",
 765 |        "  <thead>\n",
 766 |        "    <tr style=\"text-align: right;\">\n",
 767 |        "      <th></th>\n",
 768 |        "      <th>am_id</th>\n",
 769 |        "      <th>resa_code</th>\n",
 770 |        "      <th>am_name</th>\n",
 771 |        "      <th>resa_name</th>\n",
 772 |        "      <th>date</th>\n",
 773 |        "      <th>depth1</th>\n",
 774 |        "      <th>depth2</th>\n",
 775 |        "      <th>resa_ws_id</th>\n",
 776 |        "    </tr>\n",
 777 |        "  </thead>\n",
 778 |        "  <tbody>\n",
 779 |        "  </tbody>\n",
 780 |        "</table>\n",
 781 |        "</div>"
 782 |       ],
 783 |       "text/plain": [
 784 |        "Empty DataFrame\n",
 785 |        "Columns: [am_id, resa_code, am_name, resa_name, date, depth1, depth2, resa_ws_id]\n",
 786 |        "Index: []"
 787 |       ]
 788 |      },
 789 |      "execution_count": 12,
 790 |      "metadata": {},
 791 |      "output_type": "execute_result"
 792 |     }
 793 |    ],
 794 |    "source": [
 795 |     "not_found_df = am_ws[pd.isna(am_ws['resa_ws_id'])]\n",
 796 |     "not_found_df"
 797 |    ]
 798 |   },
 799 |   {
 800 |    "cell_type": "code",
 801 |    "execution_count": 13,
 802 |    "metadata": {},
 803 |    "outputs": [
 804 |     {
 805 |      "name": "stdout",
 806 |      "output_type": "stream",
 807 |      "text": [
 808 |       "[]\n"
 809 |      ]
 810 |     }
 811 |    ],
 812 |    "source": [
 813 |     "am_list = list(not_found_df['am_id'].unique().astype(str))\n",
 814 |     "print(am_list)\n",
 815 |     "if len(am_list) > 0:\n",
 816 |     "    am_ids = ','.join(am_list)\n",
 817 |     "    sql = text(f\"SELECT * \"\n",
 818 |     "               f\"FROM nivadatabase.datasource_station \"\n",
 819 |     "               f\"WHERE station_id IN ({am_ids})\")\n",
 820 |     "    pd.read_sql(sql, eng)"
 821 |    ]
 822 |   },
 823 |   {
 824 |    "cell_type": "markdown",
 825 |    "metadata": {},
 826 |    "source": [
 827 |     "## 6. Add post-2014 water samples (non-FAUN)\n",
 828 |     "\n",
 829 |     "**Note:** This code has not yet been run fully. Once the issues with Storbørja and Svartbørja have been solved, it can be run again.\n",
 830 |     "\n",
 831 |     "All of the non-FAUN samples from 2015 to 2018 should now be available in RESA (i.e. everything from Liv Bente's `Data fra RESA 2015-2018 mm` and `Data fra AquaM` worksheets). All these samples are listed in tidied form in the `am_resa_2015-2018` worksheet of `../project_overview_from_lbs.xlsx`. The code below identifies RESA sample IDs for each sample and checks that all samples can be found. They are then associated with `SAMPLE_SELECTION_ID` 66 in RESA."
 832 |    ]
 833 |   },
 834 |   {
 835 |    "cell_type": "code",
 836 |    "execution_count": 14,
 837 |    "metadata": {},
 838 |    "outputs": [
 839 |     {
 840 |      "data": {
 841 |       "text/html": [
 842 |        "<div>\n",
 843 |        "<style scoped>\n",
 844 |        "    .dataframe tbody tr th:only-of-type {\n",
 845 |        "        vertical-align: middle;\n",
 846 |        "    }\n",
 847 |        "\n",
 848 |        "    .dataframe tbody tr th {\n",
 849 |        "        vertical-align: top;\n",
 850 |        "    }\n",
 851 |        "\n",
 852 |        "    .dataframe thead th {\n",
 853 |        "        text-align: right;\n",
 854 |        "    }\n",
 855 |        "</style>\n",
 856 |        "<table border=\"1\" class=\"dataframe\">\n",
 857 |        "  <thead>\n",
 858 |        "    <tr style=\"text-align: right;\">\n",
 859 |        "      <th></th>\n",
 860 |        "      <th>station_id</th>\n",
 861 |        "      <th>date</th>\n",
 862 |        "      <th>depth1</th>\n",
 863 |        "      <th>depth2</th>\n",
 864 |        "    </tr>\n",
 865 |        "  </thead>\n",
 866 |        "  <tbody>\n",
 867 |        "    <tr>\n",
 868 |        "      <th>0</th>\n",
 869 |        "      <td>16131</td>\n",
 870 |        "      <td>2015-06-11 08:00:00</td>\n",
 871 |        "      <td>0.0</td>\n",
 872 |        "      <td>0.0</td>\n",
 873 |        "    </tr>\n",
 874 |        "    <tr>\n",
 875 |        "      <th>1</th>\n",
 876 |        "      <td>16131</td>\n",
 877 |        "      <td>2015-08-04 08:30:00</td>\n",
 878 |        "      <td>0.0</td>\n",
 879 |        "      <td>0.0</td>\n",
 880 |        "    </tr>\n",
 881 |        "    <tr>\n",
 882 |        "      <th>2</th>\n",
 883 |        "      <td>16131</td>\n",
 884 |        "      <td>2015-08-30 08:30:00</td>\n",
 885 |        "      <td>0.0</td>\n",
 886 |        "      <td>0.0</td>\n",
 887 |        "    </tr>\n",
 888 |        "    <tr>\n",
 889 |        "      <th>3</th>\n",
 890 |        "      <td>16131</td>\n",
 891 |        "      <td>2015-10-04 09:00:00</td>\n",
 892 |        "      <td>0.0</td>\n",
 893 |        "      <td>0.0</td>\n",
 894 |        "    </tr>\n",
 895 |        "    <tr>\n",
 896 |        "      <th>4</th>\n",
 897 |        "      <td>16131</td>\n",
 898 |        "      <td>2016-06-08 00:00:00</td>\n",
 899 |        "      <td>0.0</td>\n",
 900 |        "      <td>10.0</td>\n",
 901 |        "    </tr>\n",
 902 |        "  </tbody>\n",
 903 |        "</table>\n",
 904 |        "</div>"
 905 |       ],
 906 |       "text/plain": [
 907 |        "   station_id                date  depth1  depth2\n",
 908 |        "0       16131 2015-06-11 08:00:00     0.0     0.0\n",
 909 |        "1       16131 2015-08-04 08:30:00     0.0     0.0\n",
 910 |        "2       16131 2015-08-30 08:30:00     0.0     0.0\n",
 911 |        "3       16131 2015-10-04 09:00:00     0.0     0.0\n",
 912 |        "4       16131 2016-06-08 00:00:00     0.0    10.0"
 913 |       ]
 914 |      },
 915 |      "execution_count": 14,
 916 |      "metadata": {},
 917 |      "output_type": "execute_result"
 918 |     }
 919 |    ],
 920 |    "source": [
 921 |     "# Read list of post-2014 non-FAUN samples\n",
 922 |     "samp_df = pd.read_excel('../project_overview_from_lbs.xlsx',\n",
 923 |     "                        sheet_name='am_resa_2015-2018')\n",
 924 |     "samp_df.head()"
 925 |    ]
 926 |   },
 927 |   {
 928 |    "cell_type": "code",
 929 |    "execution_count": 15,
 930 |    "metadata": {},
 931 |    "outputs": [
 932 |     {
 933 |      "data": {
 934 |       "text/html": [
 935 |        "<div>\n",
 936 |        "<style scoped>\n",
 937 |        "    .dataframe tbody tr th:only-of-type {\n",
 938 |        "        vertical-align: middle;\n",
 939 |        "    }\n",
 940 |        "\n",
 941 |        "    .dataframe tbody tr th {\n",
 942 |        "        vertical-align: top;\n",
 943 |        "    }\n",
 944 |        "\n",
 945 |        "    .dataframe thead th {\n",
 946 |        "        text-align: right;\n",
 947 |        "    }\n",
 948 |        "</style>\n",
 949 |        "<table border=\"1\" class=\"dataframe\">\n",
 950 |        "  <thead>\n",
 951 |        "    <tr style=\"text-align: right;\">\n",
 952 |        "      <th></th>\n",
 953 |        "      <th>station_id</th>\n",
 954 |        "      <th>date</th>\n",
 955 |        "      <th>depth1</th>\n",
 956 |        "      <th>depth2</th>\n",
 957 |        "      <th>water_sample_id</th>\n",
 958 |        "    </tr>\n",
 959 |        "  </thead>\n",
 960 |        "  <tbody>\n",
 961 |        "    <tr>\n",
 962 |        "      <th>0</th>\n",
 963 |        "      <td>16131</td>\n",
 964 |        "      <td>2015-06-11 08:00:00</td>\n",
 965 |        "      <td>0.0</td>\n",
 966 |        "      <td>0.0</td>\n",
 967 |        "      <td>638920</td>\n",
 968 |        "    </tr>\n",
 969 |        "    <tr>\n",
 970 |        "      <th>1</th>\n",
 971 |        "      <td>16131</td>\n",
 972 |        "      <td>2015-08-04 08:30:00</td>\n",
 973 |        "      <td>0.0</td>\n",
 974 |        "      <td>0.0</td>\n",
 975 |        "      <td>642959</td>\n",
 976 |        "    </tr>\n",
 977 |        "    <tr>\n",
 978 |        "      <th>2</th>\n",
 979 |        "      <td>16131</td>\n",
 980 |        "      <td>2015-08-30 08:30:00</td>\n",
 981 |        "      <td>0.0</td>\n",
 982 |        "      <td>0.0</td>\n",
 983 |        "      <td>640953</td>\n",
 984 |        "    </tr>\n",
 985 |        "    <tr>\n",
 986 |        "      <th>3</th>\n",
 987 |        "      <td>16131</td>\n",
 988 |        "      <td>2015-10-04 09:00:00</td>\n",
 989 |        "      <td>0.0</td>\n",
 990 |        "      <td>0.0</td>\n",
 991 |        "      <td>642399</td>\n",
 992 |        "    </tr>\n",
 993 |        "    <tr>\n",
 994 |        "      <th>4</th>\n",
 995 |        "      <td>16131</td>\n",
 996 |        "      <td>2016-06-08 00:00:00</td>\n",
 997 |        "      <td>0.0</td>\n",
 998 |        "      <td>10.0</td>\n",
 999 |        "      <td>652766</td>\n",
1000 |        "    </tr>\n",
1001 |        "  </tbody>\n",
1002 |        "</table>\n",
1003 |        "</div>"
1004 |       ],
1005 |       "text/plain": [
1006 |        "   station_id                date  depth1  depth2  water_sample_id\n",
1007 |        "0       16131 2015-06-11 08:00:00     0.0     0.0           638920\n",
1008 |        "1       16131 2015-08-04 08:30:00     0.0     0.0           642959\n",
1009 |        "2       16131 2015-08-30 08:30:00     0.0     0.0           640953\n",
1010 |        "3       16131 2015-10-04 09:00:00     0.0     0.0           642399\n",
1011 |        "4       16131 2016-06-08 00:00:00     0.0    10.0           652766"
1012 |       ]
1013 |      },
1014 |      "execution_count": 15,
1015 |      "metadata": {},
1016 |      "output_type": "execute_result"
1017 |     }
1018 |    ],
1019 |    "source": [
1020 |     "# Loop over data\n",
1021 |     "ws_list = []\n",
1022 |     "for idx, row in samp_df.iterrows():   \n",
1023 |     "    # Query RESA db\n",
1024 |     "    par_dict = {'stn_id':row['station_id'],\n",
1025 |     "                'sample_date':  row['date'].date(),\n",
1026 |     "                'depth1':row['depth1'],\n",
1027 |     "                'depth2':row['depth2'],\n",
1028 |     "               }\n",
1029 |     "    \n",
1030 |     "    sql = (\"SELECT * FROM resa2.water_samples \"\n",
1031 |     "           \"WHERE station_id = :stn_id \"\n",
1032 |     "           \"AND TRUNC(sample_date) = :sample_date \"\n",
1033 |     "           \"AND depth1 = :depth1 \"\n",
1034 |     "           \"AND depth2 = :depth2\")\n",
1035 |     "    \n",
1036 |     "    res = pd.read_sql(sql, con=eng, params=par_dict)\n",
1037 |     "    \n",
1038 |     "    if len(res) == 1:\n",
1039 |     "        ws_list.append(res['water_sample_id'].iloc[0])\n",
1040 |     "    elif len(res) == 0:\n",
1041 |     "        ws_list.append(np.nan)\n",
1042 |     "    else:\n",
1043 |     "        print(stn_code, row['date'].date(), len(res))\n",
1044 |     "        ws_list.append(-1)\n",
1045 |     "\n",
1046 |     "samp_df['water_sample_id'] = ws_list\n",
1047 |     "samp_df.head()"
1048 |    ]
1049 |   },
1050 |   {
1051 |    "cell_type": "code",
1052 |    "execution_count": 16,
1053 |    "metadata": {},
1054 |    "outputs": [
1055 |     {
1056 |      "data": {
1057 |       "text/plain": [
1058 |        "station_id         346\n",
1059 |        "date               346\n",
1060 |        "depth1             346\n",
1061 |        "depth2             346\n",
1062 |        "water_sample_id    346\n",
1063 |        "dtype: int64"
1064 |       ]
1065 |      },
1066 |      "execution_count": 16,
1067 |      "metadata": {},
1068 |      "output_type": "execute_result"
1069 |     }
1070 |    ],
1071 |    "source": [
1072 |     "samp_df.count()"
1073 |    ]
1074 |   },
1075 |   {
1076 |    "cell_type": "code",
1077 |    "execution_count": 17,
1078 |    "metadata": {},
1079 |    "outputs": [
1080 |     {
1081 |      "data": {
1082 |       "text/html": [
1083 |        "<div>\n",
1084 |        "<style scoped>\n",
1085 |        "    .dataframe tbody tr th:only-of-type {\n",
1086 |        "        vertical-align: middle;\n",
1087 |        "    }\n",
1088 |        "\n",
1089 |        "    .dataframe tbody tr th {\n",
1090 |        "        vertical-align: top;\n",
1091 |        "    }\n",
1092 |        "\n",
1093 |        "    .dataframe thead th {\n",
1094 |        "        text-align: right;\n",
1095 |        "    }\n",
1096 |        "</style>\n",
1097 |        "<table border=\"1\" class=\"dataframe\">\n",
1098 |        "  <thead>\n",
1099 |        "    <tr style=\"text-align: right;\">\n",
1100 |        "      <th></th>\n",
1101 |        "      <th>station_id</th>\n",
1102 |        "      <th>date</th>\n",
1103 |        "      <th>depth1</th>\n",
1104 |        "      <th>depth2</th>\n",
1105 |        "      <th>water_sample_id</th>\n",
1106 |        "    </tr>\n",
1107 |        "  </thead>\n",
1108 |        "  <tbody>\n",
1109 |        "  </tbody>\n",
1110 |        "</table>\n",
1111 |        "</div>"
1112 |       ],
1113 |       "text/plain": [
1114 |        "Empty DataFrame\n",
1115 |        "Columns: [station_id, date, depth1, depth2, water_sample_id]\n",
1116 |        "Index: []"
1117 |       ]
1118 |      },
1119 |      "execution_count": 17,
1120 |      "metadata": {},
1121 |      "output_type": "execute_result"
1122 |     }
1123 |    ],
1124 |    "source": [
1125 |     "not_found_df = samp_df[pd.isna(samp_df['water_sample_id'])]\n",
1126 |     "not_found_df"
1127 |    ]
1128 |   },
1129 |   {
1130 |    "cell_type": "code",
1131 |    "execution_count": 18,
1132 |    "metadata": {},
1133 |    "outputs": [],
1134 |    "source": [
1135 |     "## Add to sample selection\n",
1136 |     "#samp_df['sample_selection_id'] = 66\n",
1137 |     "#samp_df = samp_df[['water_sample_id', 'sample_selection_id']]\n",
1138 |     "#\n",
1139 |     "## Write to db\n",
1140 |     "#samp_df.to_sql('sample_selections', \n",
1141 |     "#               eng, \n",
1142 |     "#               schema='RESA2', \n",
1143 |     "#               if_exists='append', \n",
1144 |     "#               index=False,\n",
1145 |     "#              )"
1146 |    ]
1147 |   },
1148 |   {
1149 |    "cell_type": "markdown",
1150 |    "metadata": {},
1151 |    "source": [
1152 |     "## 7. Data from Faun\n",
1153 |     "\n",
1154 |     "The worksheet `faun` of `../project_overview_from_lbs.xlsx` lists all the FAUN samples in Liv Bente's spreadsheet. I have also created a list of new methods with `LABORATORY=FAUN` in the worksheet `faun_methods`, which have been added to the database."
1155 |    ]
1156 |   },
1157 |   {
1158 |    "cell_type": "markdown",
1159 |    "metadata": {},
1160 |    "source": [
1161 |     "### 7.1. Link new method to parameters"
1162 |    ]
1163 |   },
1164 |   {
1165 |    "cell_type": "code",
1166 |    "execution_count": 19,
1167 |    "metadata": {},
1168 |    "outputs": [],
1169 |    "source": [
1170 |     "# Read methods from Excel\n",
1171 |     "meth_df = pd.read_excel('../project_overview_from_lbs.xlsx',\n",
1172 |     "                        sheet_name='faun_methods')\n",
1173 |     "\n",
1174 |     "# Get new method IDs from database\n",
1175 |     "sql = text(\"SELECT wc_method_id, name AS method_name \"\n",
1176 |     "           \"FROM resa2.wc_method_definitions \"\n",
1177 |     "           \"WHERE laboratory = 'FAUN'\")\n",
1178 |     "meth_id_df = pd.read_sql(sql, eng)\n",
1179 |     "\n",
1180 |     "# Join\n",
1181 |     "meth_df = pd.merge(meth_df, meth_id_df, how='left', on='method_name')\n",
1182 |     "\n",
1183 |     "# Add corr_fac = 1\n",
1184 |     "meth_df['conversion_factor'] = 1\n",
1185 |     "\n",
1186 |     "# Add to db\n",
1187 |     "par_meth_df = meth_df[['wc_parameter_id', 'wc_method_id', 'conversion_factor']]"
1188 |    ]
1189 |   },
1190 |   {
1191 |    "cell_type": "code",
1192 |    "execution_count": 20,
1193 |    "metadata": {},
1194 |    "outputs": [],
1195 |    "source": [
1196 |     "#par_meth_df.to_sql('wc_parameters_methods', \n",
1197 |     "#                   eng, \n",
1198 |     "#                   schema='RESA2', \n",
1199 |     "#                   if_exists='append', \n",
1200 |     "#                   index=False,\n",
1201 |     "#                  )"
1202 |    ]
1203 |   },
1204 |   {
1205 |    "cell_type": "markdown",
1206 |    "metadata": {},
1207 |    "source": [
1208 |     "### 7.2. Add water samples"
1209 |    ]
1210 |   },
1211 |   {
1212 |    "cell_type": "code",
1213 |    "execution_count": 21,
1214 |    "metadata": {},
1215 |    "outputs": [],
1216 |    "source": [
1217 |     "# Read FAUN data\n",
1218 |     "faun_df = pd.read_excel('../project_overview_from_lbs.xlsx',\n",
1219 |     "                        sheet_name='faun')\n",
1220 |     "\n",
1221 |     "# Add water samples\n",
1222 |     "ws_df = faun_df[['station_id', 'sample_date', 'depth1', 'depth2']]"
1223 |    ]
1224 |   },
1225 |   {
1226 |    "cell_type": "code",
1227 |    "execution_count": 22,
1228 |    "metadata": {},
1229 |    "outputs": [],
1230 |    "source": [
1231 |     "#ws_df.to_sql('water_samples', \n",
1232 |     "#             eng, \n",
1233 |     "#             schema='RESA2', \n",
1234 |     "#             if_exists='append', \n",
1235 |     "#             index=False,\n",
1236 |     "#            )"
1237 |    ]
1238 |   },
1239 |   {
1240 |    "cell_type": "markdown",
1241 |    "metadata": {},
1242 |    "source": [
1243 |     "### 7.3. Add water chemistry"
1244 |    ]
1245 |   },
1246 |   {
1247 |    "cell_type": "code",
1248 |    "execution_count": 23,
1249 |    "metadata": {},
1250 |    "outputs": [],
1251 |    "source": [
1252 |     "def f(row):\n",
1253 |     "    \"\"\" Return the flag character found in row['value'].\n",
1254 |     "\n",
1255 |     "        Gives '<' or '>' when the text contains one ('<' is checked\n",
1256 |     "        first); otherwise np.nan.\n",
1257 |     "    \"\"\"\n",
1258 |     "    for flag in ('<', '>'):\n",
1259 |     "        if flag in row['value']:\n",
1260 |     "            return flag\n",
1261 |     "    return np.nan"
1262 |    ]
1263 |   },
1264 |   {
1265 |    "cell_type": "code",
1266 |    "execution_count": 24,
1267 |    "metadata": {},
1268 |    "outputs": [
1269 |     {
1270 |      "data": {
1271 |       "text/html": [
1272 |        "<div>\n",
1273 |        "<style scoped>\n",
1274 |        "    .dataframe tbody tr th:only-of-type {\n",
1275 |        "        vertical-align: middle;\n",
1276 |        "    }\n",
1277 |        "\n",
1278 |        "    .dataframe tbody tr th {\n",
1279 |        "        vertical-align: top;\n",
1280 |        "    }\n",
1281 |        "\n",
1282 |        "    .dataframe thead th {\n",
1283 |        "        text-align: right;\n",
1284 |        "    }\n",
1285 |        "</style>\n",
1286 |        "<table border=\"1\" class=\"dataframe\">\n",
1287 |        "  <thead>\n",
1288 |        "    <tr style=\"text-align: right;\">\n",
1289 |        "      <th></th>\n",
1290 |        "      <th>sample_id</th>\n",
1291 |        "      <th>method_id</th>\n",
1292 |        "      <th>value</th>\n",
1293 |        "      <th>flag1</th>\n",
1294 |        "      <th>approved</th>\n",
1295 |        "    </tr>\n",
1296 |        "  </thead>\n",
1297 |        "  <tbody>\n",
1298 |        "    <tr>\n",
1299 |        "      <th>0</th>\n",
1300 |        "      <td>872225</td>\n",
1301 |        "      <td>10959</td>\n",
1302 |        "      <td>4.9</td>\n",
1303 |        "      <td>NaN</td>\n",
1304 |        "      <td>YES</td>\n",
1305 |        "    </tr>\n",
1306 |        "    <tr>\n",
1307 |        "      <th>1</th>\n",
1308 |        "      <td>872226</td>\n",
1309 |        "      <td>10959</td>\n",
1310 |        "      <td>5.4</td>\n",
1311 |        "      <td>NaN</td>\n",
1312 |        "      <td>YES</td>\n",
1313 |        "    </tr>\n",
1314 |        "    <tr>\n",
1315 |        "      <th>2</th>\n",
1316 |        "      <td>872227</td>\n",
1317 |        "      <td>10959</td>\n",
1318 |        "      <td>5.0</td>\n",
1319 |        "      <td>NaN</td>\n",
1320 |        "      <td>YES</td>\n",
1321 |        "    </tr>\n",
1322 |        "    <tr>\n",
1323 |        "      <th>3</th>\n",
1324 |        "      <td>872245</td>\n",
1325 |        "      <td>10959</td>\n",
1326 |        "      <td>5.2</td>\n",
1327 |        "      <td>NaN</td>\n",
1328 |        "      <td>YES</td>\n",
1329 |        "    </tr>\n",
1330 |        "    <tr>\n",
1331 |        "      <th>4</th>\n",
1332 |        "      <td>872246</td>\n",
1333 |        "      <td>10959</td>\n",
1334 |        "      <td>5.4</td>\n",
1335 |        "      <td>NaN</td>\n",
1336 |        "      <td>YES</td>\n",
1337 |        "    </tr>\n",
1338 |        "  </tbody>\n",
1339 |        "</table>\n",
1340 |        "</div>"
1341 |       ],
1342 |       "text/plain": [
1343 |        "   sample_id  method_id  value flag1 approved\n",
1344 |        "0     872225      10959    4.9   NaN      YES\n",
1345 |        "1     872226      10959    5.4   NaN      YES\n",
1346 |        "2     872227      10959    5.0   NaN      YES\n",
1347 |        "3     872245      10959    5.2   NaN      YES\n",
1348 |        "4     872246      10959    5.4   NaN      YES"
1349 |       ]
1350 |      },
1351 |      "execution_count": 24,
1352 |      "metadata": {},
1353 |      "output_type": "execute_result"
1354 |     }
1355 |    ],
1356 |    "source": [
1357 |     "# Get ws_ids: query the samples already in RESA2 for the FAUN stations.\n",
1358 |     "# The station IDs are interpolated into the SQL text as a comma-separated list.\n",
1359 |     "stn_list = list(ws_df['station_id'].unique().astype(str))\n",
1360 |     "stn_txt = ','.join(stn_list)\n",
1361 |     "\n",
1362 |     "sql = text(\"SELECT water_sample_id, station_id, sample_date, depth1, depth2 \"\n",
1363 |     "           \"FROM resa2.water_samples \"\n",
1364 |     "           \"WHERE station_id in (%s)\" % stn_txt)\n",
1365 |     "\n",
1366 |     "samp_df = pd.read_sql(sql, eng)\n",
1367 |     "\n",
1368 |     "# Link to faun data, then drop the join keys and the station code\n",
1369 |     "key_cols = ['station_id', 'sample_date', 'depth1', 'depth2']\n",
1370 |     "df = pd.merge(faun_df,\n",
1371 |     "              samp_df,\n",
1372 |     "              how='left',\n",
1373 |     "              on=key_cols)\n",
1374 |     "df = df.drop(key_cols + ['station_code'], axis=1)\n",
1375 |     "\n",
1376 |     "# Convert to long format\n",
1377 |     "df = df.melt(id_vars='water_sample_id', var_name='method_name').dropna()\n",
1378 |     "\n",
1379 |     "# Join method IDs\n",
1380 |     "df = pd.merge(df,\n",
1381 |     "              meth_df[['method_name', 'wc_method_id']],\n",
1382 |     "              how='left',\n",
1383 |     "              on='method_name')\n",
1384 |     "\n",
1385 |     "# Deal with flags: '<' and '>' are embedded in the value text\n",
1386 |     "df['value'] = df['value'].astype(str)\n",
1387 |     "df['flag1'] = df.apply(f, axis=1)\n",
1388 |     "\n",
1389 |     "# Extract numeric chars. The pattern is a raw string so '\\d' is not parsed\n",
1390 |     "# as a string escape; the optional sign applies to integers as well as\n",
1391 |     "# decimals; and an exponent is accepted because str() writes small floats\n",
1392 |     "# in scientific notation (e.g. '1e-05').\n",
1393 |     "num_regex = r\"([-+]?(?:\\d*\\.\\d+|\\d+)(?:[eE][-+]?\\d+)?)\"\n",
1394 |     "df['value'] = df['value'].str.extract(num_regex, expand=False)\n",
1395 |     "df['value'] = df['value'].astype(float)\n",
1396 |     "\n",
1397 |     "# Reorder and rename columns\n",
1398 |     "df = df[['water_sample_id', 'wc_method_id', 'value', 'flag1']]\n",
1399 |     "df.columns = ['sample_id', 'method_id', 'value', 'flag1']\n",
1400 |     "df['approved'] = 'YES'\n",
1401 |     "\n",
1402 |     "df.head()"
1403 |    ]
1404 |   },
1405 |   {
1406 |    "cell_type": "code",
1407 |    "execution_count": 25,
1408 |    "metadata": {},
1409 |    "outputs": [],
1410 |    "source": [
1411 |     "## Add to db\n",
1412 |     "#df.to_sql('water_chemistry_values2', \n",
1413 |     "#          eng, \n",
1414 |     "#          schema='RESA2', \n",
1415 |     "#          if_exists='append', \n",
1416 |     "#          index=False,\n",
1417 |     "#         )"
1418 |    ]
1419 |   },
1420 |   {
1421 |    "cell_type": "markdown",
1422 |    "metadata": {},
1423 |    "source": [
1424 |     "### 7.4. Add to sample selection"
1425 |    ]
1426 |   },
1427 |   {
1428 |    "cell_type": "code",
1429 |    "execution_count": 26,
1430 |    "metadata": {},
1431 |    "outputs": [],
1432 |    "source": [
1433 |     "# Build df: one row per distinct sample ID, each tagged with selection ID 66\n",
1434 |     "sample_ids = df['sample_id'].unique()\n",
1435 |     "ws_df = pd.DataFrame({'water_sample_id':sample_ids}).assign(sample_selection_id=66)\n",
1436 |     "\n",
1437 |     "## Write to db\n",
1438 |     "#ws_df.to_sql('sample_selections', \n",
1439 |     "#             eng, \n",
1440 |     "#             schema='RESA2', \n",
1441 |     "#             if_exists='append', \n",
1442 |     "#             index=False,\n",
1443 |     "#            )"
1444 |    ]
1445 |   },
1446 |   {
1447 |    "cell_type": "markdown",
1448 |    "metadata": {},
1449 |    "source": [
1450 |     "## 8. Additions from Liv Bente\n",
1451 |     "\n",
1452 |     "After some further checking, Liv Bente has identified some additional samples that should be included (see e-mail received 20.08.2020 at 16:30). These samples are listed in \n",
1453 |     "\n",
1454 |     "    biolok/water_samples_to_add_2020-08-21.xlsx"
1455 |    ]
1456 |   },
1457 |   {
1458 |    "cell_type": "code",
1459 |    "execution_count": 5,
1460 |    "metadata": {},
1461 |    "outputs": [
1462 |     {
1463 |      "data": {
1464 |       "text/html": [
1465 |        "<div>\n",
1466 |        "<style scoped>\n",
1467 |        "    .dataframe tbody tr th:only-of-type {\n",
1468 |        "        vertical-align: middle;\n",
1469 |        "    }\n",
1470 |        "\n",
1471 |        "    .dataframe tbody tr th {\n",
1472 |        "        vertical-align: top;\n",
1473 |        "    }\n",
1474 |        "\n",
1475 |        "    .dataframe thead th {\n",
1476 |        "        text-align: right;\n",
1477 |        "    }\n",
1478 |        "</style>\n",
1479 |        "<table border=\"1\" class=\"dataframe\">\n",
1480 |        "  <thead>\n",
1481 |        "    <tr style=\"text-align: right;\">\n",
1482 |        "      <th></th>\n",
1483 |        "      <th>station_id</th>\n",
1484 |        "      <th>station_code</th>\n",
1485 |        "      <th>station_name</th>\n",
1486 |        "      <th>date</th>\n",
1487 |        "      <th>depth1</th>\n",
1488 |        "      <th>depth2</th>\n",
1489 |        "    </tr>\n",
1490 |        "  </thead>\n",
1491 |        "  <tbody>\n",
1492 |        "    <tr>\n",
1493 |        "      <th>0</th>\n",
1494 |        "      <td>195</td>\n",
1495 |        "      <td>1502-602</td>\n",
1496 |        "      <td>Lunddalsvatnet</td>\n",
1497 |        "      <td>2015-05-26</td>\n",
1498 |        "      <td>0</td>\n",
1499 |        "      <td>12.5</td>\n",
1500 |        "    </tr>\n",
1501 |        "    <tr>\n",
1502 |        "      <th>1</th>\n",
1503 |        "      <td>195</td>\n",
1504 |        "      <td>1502-602</td>\n",
1505 |        "      <td>Lunddalsvatnet</td>\n",
1506 |        "      <td>2015-06-30</td>\n",
1507 |        "      <td>0</td>\n",
1508 |        "      <td>15.0</td>\n",
1509 |        "    </tr>\n",
1510 |        "    <tr>\n",
1511 |        "      <th>2</th>\n",
1512 |        "      <td>195</td>\n",
1513 |        "      <td>1502-602</td>\n",
1514 |        "      <td>Lunddalsvatnet</td>\n",
1515 |        "      <td>2015-07-27</td>\n",
1516 |        "      <td>0</td>\n",
1517 |        "      <td>0.0</td>\n",
1518 |        "    </tr>\n",
1519 |        "    <tr>\n",
1520 |        "      <th>3</th>\n",
1521 |        "      <td>195</td>\n",
1522 |        "      <td>1502-602</td>\n",
1523 |        "      <td>Lunddalsvatnet</td>\n",
1524 |        "      <td>2015-08-19</td>\n",
1525 |        "      <td>0</td>\n",
1526 |        "      <td>12.0</td>\n",
1527 |        "    </tr>\n",
1528 |        "    <tr>\n",
1529 |        "      <th>4</th>\n",
1530 |        "      <td>195</td>\n",
1531 |        "      <td>1502-602</td>\n",
1532 |        "      <td>Lunddalsvatnet</td>\n",
1533 |        "      <td>2015-09-21</td>\n",
1534 |        "      <td>0</td>\n",
1535 |        "      <td>14.0</td>\n",
1536 |        "    </tr>\n",
1537 |        "  </tbody>\n",
1538 |        "</table>\n",
1539 |        "</div>"
1540 |       ],
1541 |       "text/plain": [
1542 |        "   station_id station_code    station_name       date  depth1  depth2\n",
1543 |        "0         195     1502-602  Lunddalsvatnet 2015-05-26       0    12.5\n",
1544 |        "1         195     1502-602  Lunddalsvatnet 2015-06-30       0    15.0\n",
1545 |        "2         195     1502-602  Lunddalsvatnet 2015-07-27       0     0.0\n",
1546 |        "3         195     1502-602  Lunddalsvatnet 2015-08-19       0    12.0\n",
1547 |        "4         195     1502-602  Lunddalsvatnet 2015-09-21       0    14.0"
1548 |       ]
1549 |      },
1550 |      "execution_count": 5,
1551 |      "metadata": {},
1552 |      "output_type": "execute_result"
1553 |     }
1554 |    ],
1555 |    "source": [
1556 |     "# Load the extra (post-2014, non-FAUN) samples from the 'to_add' sheet\n",
1557 |     "extra_xlsx = '../water_samples_to_add_2020-08-21.xlsx'\n",
1558 |     "samp_df = pd.read_excel(extra_xlsx, sheet_name='to_add')\n",
1559 |     "samp_df.head()"
1560 |    ]
1561 |   },
1562 |   {
1563 |    "cell_type": "code",
1564 |    "execution_count": 8,
1565 |    "metadata": {},
1566 |    "outputs": [
1567 |     {
1568 |      "data": {
1569 |       "text/html": [
1570 |        "<div>\n",
1571 |        "<style scoped>\n",
1572 |        "    .dataframe tbody tr th:only-of-type {\n",
1573 |        "        vertical-align: middle;\n",
1574 |        "    }\n",
1575 |        "\n",
1576 |        "    .dataframe tbody tr th {\n",
1577 |        "        vertical-align: top;\n",
1578 |        "    }\n",
1579 |        "\n",
1580 |        "    .dataframe thead th {\n",
1581 |        "        text-align: right;\n",
1582 |        "    }\n",
1583 |        "</style>\n",
1584 |        "<table border=\"1\" class=\"dataframe\">\n",
1585 |        "  <thead>\n",
1586 |        "    <tr style=\"text-align: right;\">\n",
1587 |        "      <th></th>\n",
1588 |        "      <th>station_id</th>\n",
1589 |        "      <th>station_code</th>\n",
1590 |        "      <th>station_name</th>\n",
1591 |        "      <th>date</th>\n",
1592 |        "      <th>depth1</th>\n",
1593 |        "      <th>depth2</th>\n",
1594 |        "      <th>water_sample_id</th>\n",
1595 |        "    </tr>\n",
1596 |        "  </thead>\n",
1597 |        "  <tbody>\n",
1598 |        "    <tr>\n",
1599 |        "      <th>0</th>\n",
1600 |        "      <td>195</td>\n",
1601 |        "      <td>1502-602</td>\n",
1602 |        "      <td>Lunddalsvatnet</td>\n",
1603 |        "      <td>2015-05-26</td>\n",
1604 |        "      <td>0</td>\n",
1605 |        "      <td>12.5</td>\n",
1606 |        "      <td>872164</td>\n",
1607 |        "    </tr>\n",
1608 |        "    <tr>\n",
1609 |        "      <th>1</th>\n",
1610 |        "      <td>195</td>\n",
1611 |        "      <td>1502-602</td>\n",
1612 |        "      <td>Lunddalsvatnet</td>\n",
1613 |        "      <td>2015-06-30</td>\n",
1614 |        "      <td>0</td>\n",
1615 |        "      <td>15.0</td>\n",
1616 |        "      <td>872160</td>\n",
1617 |        "    </tr>\n",
1618 |        "    <tr>\n",
1619 |        "      <th>2</th>\n",
1620 |        "      <td>195</td>\n",
1621 |        "      <td>1502-602</td>\n",
1622 |        "      <td>Lunddalsvatnet</td>\n",
1623 |        "      <td>2015-07-27</td>\n",
1624 |        "      <td>0</td>\n",
1625 |        "      <td>0.0</td>\n",
1626 |        "      <td>872166</td>\n",
1627 |        "    </tr>\n",
1628 |        "    <tr>\n",
1629 |        "      <th>3</th>\n",
1630 |        "      <td>195</td>\n",
1631 |        "      <td>1502-602</td>\n",
1632 |        "      <td>Lunddalsvatnet</td>\n",
1633 |        "      <td>2015-08-19</td>\n",
1634 |        "      <td>0</td>\n",
1635 |        "      <td>12.0</td>\n",
1636 |        "      <td>872158</td>\n",
1637 |        "    </tr>\n",
1638 |        "    <tr>\n",
1639 |        "      <th>4</th>\n",
1640 |        "      <td>195</td>\n",
1641 |        "      <td>1502-602</td>\n",
1642 |        "      <td>Lunddalsvatnet</td>\n",
1643 |        "      <td>2015-09-21</td>\n",
1644 |        "      <td>0</td>\n",
1645 |        "      <td>14.0</td>\n",
1646 |        "      <td>872156</td>\n",
1647 |        "    </tr>\n",
1648 |        "  </tbody>\n",
1649 |        "</table>\n",
1650 |        "</div>"
1651 |       ],
1652 |       "text/plain": [
1653 |        "   station_id station_code    station_name       date  depth1  depth2  \\\n",
1654 |        "0         195     1502-602  Lunddalsvatnet 2015-05-26       0    12.5   \n",
1655 |        "1         195     1502-602  Lunddalsvatnet 2015-06-30       0    15.0   \n",
1656 |        "2         195     1502-602  Lunddalsvatnet 2015-07-27       0     0.0   \n",
1657 |        "3         195     1502-602  Lunddalsvatnet 2015-08-19       0    12.0   \n",
1658 |        "4         195     1502-602  Lunddalsvatnet 2015-09-21       0    14.0   \n",
1659 |        "\n",
1660 |        "   water_sample_id  \n",
1661 |        "0           872164  \n",
1662 |        "1           872160  \n",
1663 |        "2           872166  \n",
1664 |        "3           872158  \n",
1665 |        "4           872156  "
1666 |       ]
1667 |      },
1668 |      "execution_count": 8,
1669 |      "metadata": {},
1670 |      "output_type": "execute_result"
1671 |     }
1672 |    ],
1673 |    "source": [
1674 |     "# Look up the water_sample_id in RESA2 for each row of samp_df\n",
1675 |     "ws_list = []\n",
1676 |     "\n",
1677 |     "# The query text does not change between rows, so build it once\n",
1678 |     "sql = (\"SELECT * FROM resa2.water_samples \"\n",
1679 |     "       \"WHERE station_id = :stn_id \"\n",
1680 |     "       \"AND TRUNC(sample_date) = :sample_date \"\n",
1681 |     "       \"AND depth1 = :depth1 \"\n",
1682 |     "       \"AND depth2 = :depth2\")\n",
1683 |     "\n",
1684 |     "for idx, row in samp_df.iterrows():\n",
1685 |     "    samp_date = row['date'].date()\n",
1686 |     "    par_dict = {'stn_id':row['station_id'],\n",
1687 |     "                'sample_date':samp_date,\n",
1688 |     "                'depth1':row['depth1'],\n",
1689 |     "                'depth2':row['depth2'],\n",
1690 |     "               }\n",
1691 |     "    res = pd.read_sql(sql, con=eng, params=par_dict)\n",
1692 |     "\n",
1693 |     "    if len(res) == 1:\n",
1694 |     "        ws_list.append(res['water_sample_id'].iloc[0])\n",
1695 |     "    else:\n",
1696 |     "        # No match -> NaN; several matches -> -1. Report the station code\n",
1697 |     "        # from the current row ('stn_code' is not defined in this cell)\n",
1698 |     "        print(row['station_code'], samp_date, len(res))\n",
1699 |     "        ws_list.append(np.nan if len(res) == 0 else -1)\n",
1700 |     "\n",
1701 |     "samp_df['water_sample_id'] = ws_list\n",
1702 |     "samp_df.head()"
1703 |    ]
1704 |   },
1705 |   {
1706 |    "cell_type": "code",
1707 |    "execution_count": 9,
1708 |    "metadata": {},
1709 |    "outputs": [],
1710 |    "source": [
1711 |     "## Add to sample selection\n",
1712 |     "#samp_df['sample_selection_id'] = 66\n",
1713 |     "#samp_df = samp_df[['water_sample_id', 'sample_selection_id']]\n",
1714 |     "#\n",
1715 |     "## Write to db\n",
1716 |     "#samp_df.to_sql('sample_selections', \n",
1717 |     "#               eng, \n",
1718 |     "#               schema='RESA2', \n",
1719 |     "#               if_exists='append', \n",
1720 |     "#               index=False,\n",
1721 |     "#              )"
1722 |    ]
1723 |   }
1724 |  ],
1725 |  "metadata": {
1726 |   "kernelspec": {
1727 |    "display_name": "Python 3",
1728 |    "language": "python",
1729 |    "name": "python3"
1730 |   },
1731 |   "language_info": {
1732 |    "codemirror_mode": {
1733 |     "name": "ipython",
1734 |     "version": 3
1735 |    },
1736 |    "file_extension": ".py",
1737 |    "mimetype": "text/x-python",
1738 |    "name": "python",
1739 |    "nbconvert_exporter": "python",
1740 |    "pygments_lexer": "ipython3",
1741 |    "version": "3.7.6"
1742 |   }
1743 |  },
1744 |  "nbformat": 4,
1745 |  "nbformat_minor": 4
1746 | }
1747 | 


--------------------------------------------------------------------------------