compton
/
sources


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242
							"""
The script is for corresponding the elabels from database and compton average measurements
run it on cc-8 with the command:
`python3 elabelizer.py`

If this script is not working properly, try to setup environment firstly with the following command in bash:
`source /sl/cmd3/cc8-64/Cmd3Off/tune.cmd3_runs_scripts.sh`

This script is inspired by listoffdata.py script (/sl/cmd3/cc7-64/Cmd3Off/scripts/listoffdata.py)
"""

from datetime import datetime
from typing import Dict, List, Tuple, NamedTuple, Optional
from pathlib import Path
from urllib.request import urlopen

import json
import os 

os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'settings_read_all')
API_KEY = "9e3b3d9b7a57098bb1bc0e5c5053f2084251cd00"

import django
django.setup()
from cmdweb.apps.cmd3off.energypoints.models import EnergyPoint, Param, ParamData

class RowEPoint(NamedTuple):
    """Structure of the energy point metadata"""
    elabel: str
    first_run: int
    last_run: int
    nominal_energy: float
    start_time: datetime
    stop_time: datetime
    season: str

class AvgEPoint(NamedTuple):
    """Structure of the averaged beam energy point"""
    energy_mean: float
    first_run: int
    last_run: int
    nominal_energy: float
    season: str

class CombinedEPoint(NamedTuple):
    """Structure of the combined energy point"""
    season: str
    elabel: Optional[str]
    energy_mean: Optional[float]


def retrieve_elabels(startrun: int, stoprun: int) -> List[RowEPoint]:
    """Retrieves elabels from database
    
    Parameters:
    -----------
    startrun : int
        first run for retrieving
    stoprun : int
        last run for retrieving
    
    Returns:
    --------
    List[RowEPoint]
        list of elabels and information about them
        (elabel, firstrun, lastrun, nominal energy, starttime, stoptime, season)
    """
    
    points, seasons = [], []
    # Get seasons (they are sorted by date)
    for e in EnergyPoint.objects.filter(name__startswith="Season"):
        info = [e.name[7:], e.startrun, e.endrun]
        seasons.append(info)
    
    # Get energy points (they are sorted by date) and match corresponing seasons
    season_idx = 0
    for e in EnergyPoint.objects.filter(startrun__gte=startrun, endrun__lte=stoprun):
        while((e.startrun < seasons[season_idx][1]) or (e.endrun > seasons[season_idx][2])):
            season_idx+=1
        info = RowEPoint(
            elabel = e.name, 
            first_run = e.startrun, 
            last_run = e.endrun, 
            nominal_energy = e.energy, 
            start_time = e.starttime, 
            stop_time = e.endtime, 
            season = seasons[season_idx][0]
        )
        if not(e.name.startswith("Season")):
            points.append(info)
    return points
    
def get_available_compton_seasons() -> Dict[str, str]:
    """Returns a dictionary containing all available 
    average energy season tables
    
    Returns
    -------
    Dict[str, str]
        keys are season names, values are pathes to the tables
    """

    tables_url = f'https://cmd.inp.nsk.su/~compton/gogs/api/v1/repos/compton/tables/contents/?token={API_KEY}'
    with urlopen(tables_url) as f:
        data_str = f.read().decode('utf-8')
        data = json.loads(data_str)
        datarows = {Path(row['name']).stem: row['download_url'] for row in
        filter(lambda x: (x['type'] == 'file') and x['name'].endswith('.csv'), data)}
    return datarows

def retrieve_comptons(season_names: Optional[List[str]] = None) -> List[AvgEPoint]:
    """Retrieves compton measurements from tables
    
    Parameters:
    -----------
    season_names: Optional[List[str]]
        list of seasons for retrieving
        (default is None, it means retrieving all available seasons)
    
    Returns:
    --------
    List[AvgEPoint]
        list of compton means measurements
        (season, energy_point, first_run, last_run, mean_energy)
        first_run and last_run can be different from the corresponding energy points from elabels database
    """
    
    available_seasons = get_available_compton_seasons()
    seasons = dict()
    if season_names is not None:
        for s in season_names:
            try:
                seasons[s] = available_seasons[s]
            except KeyError:
                raise ValueError(f"Season {s} is not found. List of available seasons: {available_seasons.keys()}")
    else:
        seasons = available_seasons
        
    def parse_compton_row(row: str, season: str) -> AvgEPoint:
        items = row.split(',')
        return AvgEPoint(
            season=season, 
            nominal_energy=float(items[0]), 
            first_run=int(items[1]), 
            last_run=int(items[2]), 
            energy_mean=float(items[3])
        )
    
    def retrieve_compton_one_season(season_name: str, season_table_url: str) -> List[AvgEPoint]:
        with urlopen(season_table_url) as f:
            r = f.read().decode('utf-8').strip()
            rows = list(map(lambda x: parse_compton_row(x, s_name), r.split('\n')[1:]))
        return rows
                    
    datarows = []
    for s_name, s_table in seasons.items():
        seasonrows = retrieve_compton_one_season(s_name, s_table)
        datarows.extend(seasonrows)
    
    return datarows
        
def combine_compton_elabel(epoints: List[RowEPoint], comptonpoints: List[AvgEPoint]) -> List[CombinedEPoint]:
    """Combines compton energy points and elabels from database
    
    Parameters:
    -----------
    epoints : List[RowEPoint]
        list of energy points
    comptonpoints : List[AvgEPoint]
        list of compton averaged points
    
    Returns:
    --------
    combpoints : List[CombinedEPoint]
        list of combined points (outer join)
    """
    
    epoints_sorted = sorted(epoints, key=lambda x: x.first_run)
    cpoints_sorted = sorted(comptonpoints, key=lambda x: x.first_run)
    
    combined_data = []
    
    eidx, cidx = 0, 0
    while (eidx < len(epoints_sorted)) and (cidx < len(cpoints_sorted)):
        erow = epoints_sorted[eidx]
        crow = cpoints_sorted[cidx]
        
        cstart, cstop, cenergy, cseason = crow.first_run, crow.last_run, crow.energy_mean, crow.season
        estart, estop, elabel, eseason = erow.first_run, erow.last_run, erow.elabel, erow.season
        
        if (cstart >= estart) and (cstop <= estop):
            combrow = CombinedEPoint(eseason, elabel, cenergy)
            eidx += 1
            cidx += 1
            #print(combrow)
        elif (cstart > estop):
            combrow = CombinedEPoint(eseason, elabel, None)
            eidx += 1
        elif (estart > cstop):
            combrow = CombinedEPoint(cseason, None, cenergy)
            cidx += 1
        else:
            raise Exception("Something wrong")
        
        # print(combrow)
        combined_data.append(combrow)
    
    for i in range(eidx, len(epoints_sorted)):
        erow = epoints_sorted[i]
        combrow = CombinedEPoint(erow.season, erow.elabel, None)
        combined_data.append(combrow)
        
    for i in range(cidx, len(cpoints_sorted)):
        crow = cpoints_sorted[i]
        combrow = CombinedEPoint(crow.season, None, crow.energy_mean)
        combined_data.append(combrow)
    
    return combined_data


def elabelize() -> List[CombinedEPoint]:
    RUNLIMITS = (17405, 200000)
    SEASONS = None
    epoints = retrieve_elabels(*RUNLIMITS)
    comptonpoints = retrieve_comptons(SEASONS)
    
    combdata = combine_compton_elabel(epoints, comptonpoints)
    return combdata
    
def main():
    combdata = elabelize()
    for c in combdata:
        season, elabel, energy = c.season, c.elabel, c.energy_mean
        if season is None:
            season = ''
        if elabel is None:
            elabel = ''
        print(f'{season:>15s}, {elabel:>13s}, {energy}')
    print('The number of not found points in compton is', len(list(filter(lambda x: x[2] is None, combdata))))
    
if __name__=="__main__":
    main()