In [8]:
import os
import sys
from functools import singledispatch
import warnings

import pandas as pd
import numpy as np

from plio.examples import get_path
from plio.io.io_bae import read_gpf

In [9]:
def read_atf(atf_file):
    """
    Read an .atf file and collect the files it references

    Only lines whose text ends in prj, gpf, sup, ipf or atf are considered.
    Each such line is expected to hold a keyword followed by a file name,
    separated by whitespace.

    Parameters
    ----------
    atf_file : str
               path to the .atf file

    Returns
    -------
    files_dict : dict
                 maps every keyword found to its file name (the last
                 occurrence wins for repeated keywords), plus:
                 'IMAGE_IPF' : list of every file name ending in .ipf,
                 'IMAGE_SUP' : list of every file name ending in .sup,
                 'PATH' : absolute directory that contains atf_file
    """
    extensions = ('prj', 'gpf', 'sup', 'ipf', 'atf')

    ipf = []
    sup = []
    files_dict = {}

    with open(atf_file) as f:
        for line in f:
            # Strip before testing the suffix so that the final line of a
            # file without a trailing newline (or a line followed by stray
            # blanks) is recognised exactly like every other line.
            entry = line.strip()
            if not entry.endswith(extensions):
                continue

            # Split on any run of whitespace; keep the remainder intact so
            # the file name is never broken into several pieces.
            fields = entry.split(None, 1)
            if len(fields) != 2:
                # A bare file name has no keyword to be stored under.
                continue
            key, value = fields

            # Grabs all the IPF files
            if value.endswith('.ipf'):
                ipf.append(value)

            # Grabs all the SUP files
            if value.endswith('.sup'):
                sup.append(value)

            files_dict[key] = value

    # Sets the value of IMAGE_IPF to all IPF images
    files_dict['IMAGE_IPF'] = ipf

    # Sets the value of IMAGE_SUP to all SUP images
    files_dict['IMAGE_SUP'] = sup

    # Sets the value of PATH to the path of the ATF file
    files_dict['PATH'] = os.path.dirname(os.path.abspath(atf_file))

    return files_dict
    
@singledispatch
def read_ipf(arg):
    """
    Generic entry point for reading ipf data, dispatched on the type of arg

    This is the fallback used when no implementation has been registered
    for the type of the argument; it simply hands back the string form of
    whatever it was given.

    Parameters
    ----------
    arg : object
          any value without a registered reader

    Returns
    -------
    : str
      str(arg)
    """
    as_text = str(arg)
    return as_text

@read_ipf.register(str)
def read_ipf_str(input_data):
    """
    Read a socet ipf file into a pandas data frame

    The second line of the file holds the expected number of points and the
    third line the comma separated column names; everything after that is
    treated as a whitespace separated stream of values that is folded into
    one row per point.

    Parameters
    ----------
    input_data : str
                 path to an input data file

    Returns
    -------
    df : pd.DataFrame
         containing the ipf data with appropriate column names and an extra
         'ipf_file' column holding the file name without directory or
         extension

    Raises
    ------
    ValueError
        if the file has fewer than three lines, or the values cannot be
        folded into complete rows
    AssertionError
        if the number of rows read differs from the count in the header
    """
    def _soft_numeric(series):
        # Convert a column to a numeric dtype when every value allows it,
        # otherwise leave it untouched (e.g. the string point ids).
        try:
            return pd.to_numeric(series)
        except (ValueError, TypeError):
            return series

    # Read the file once and make sure the handle is closed again
    with open(input_data, 'r') as f:
        lines = f.readlines()

    if len(lines) < 3:
        raise ValueError('{} is too short to be an ipf file: expected a point '
                         'count on line 2 and column names on line 3.'.format(input_data))

    # Expected number of points, checked against the parsed rows below
    cnt = int(lines[1])

    columns = np.atleast_1d(np.genfromtxt(input_data, skip_header=2, dtype='unicode',
                                          max_rows=1, delimiter=','))

    # A single point is spread over several lines holding different numbers
    # of values, so flatten in plain Python; building a numpy array straight
    # from the ragged per-line lists is rejected by recent numpy releases.
    tokens = [token for line in lines[3:] for token in line.split()]
    d = np.array(tokens, dtype=str).reshape(-1, len(columns))

    df = pd.DataFrame(d, columns=columns)
    ipf_name = os.path.split(os.path.splitext(input_data)[0])[1]
    df['ipf_file'] = ipf_name

    assert int(cnt) == len(df), 'Dataframe length {} does not match point length {}.'.format(int(cnt), len(df))

    # Soft conversion of numeric types to numerics, allows str in first col for point_id
    df = df.apply(_soft_numeric)

    return df

@read_ipf.register(list)
def read_ipf_list(input_data_list):
    """
    Read a set of socet ipf files into a single pandas data frame

    Every entry of the list is passed to read_ipf and the resulting frames
    are concatenated in list order.

    Parameters
    ----------
    input_data_list : list
                      list of paths to a set of input data files

    Returns
    -------
    df : pd.DataFrame
         the concatenation of the frames read from each input file
    """
    return pd.concat([read_ipf(ipf_path) for ipf_path in input_data_list])

In [10]:
# Resolve the gpf file and every ipf file listed in the example atf file
atf_dict = read_atf(get_path('CTX_Athabasca_Middle_step0.atf'))

gpf_file = os.path.join(atf_dict['PATH'], atf_dict['GP_FILE'])
ipf_list = [os.path.join(atf_dict['PATH'], i) for i in atf_dict['IMAGE_IPF']]

# Index both tables by point id so they can be compared and joined
gpf_df = read_gpf(gpf_file).set_index('point_id')
ipf_df = read_ipf(ipf_list).set_index('pt_id')

# Point ids that occur in the ipf files but not in the gpf file
point_diff = ipf_df.index.difference(gpf_df.index)

if len(point_diff) != 0:
    # Adjacent literals instead of a backslash continuation inside the
    # string, which used to embed the source indentation in the message.
    warnings.warn(("The following points found in ipf files missing from gpf file: \n\n{}."
                   "\n\nContinuing, but these points will be missing from the control network"
                   ).format(list(point_diff)))

# Inner join on the index: points without a gpf entry are dropped
new_df = ipf_df.merge(gpf_df, left_index=True, right_index=True)

# Preview only; the full frame stays available as new_df
new_df.head(10)


['P03_002226_1895_XI_09N203W_15', 'P03_002226_1895_XI_09N203W_16', 'P03_002226_1895_XI_09N203W_17', 'P03_002226_1895_XI_09N203W_18', 'P03_002226_1895_XI_09N203W_19', 'P03_002226_1895_XI_09N203W_20', 'P03_002226_1895_XI_09N203W_21', 'P03_002226_1895_XI_09N203W_22', 'P03_002226_1895_XI_09N203W_24', 'P03_002226_1895_XI_09N203W_26', 'P03_002226_1895_XI_09N203W_30', 'P03_002226_1895_XI_09N203W_31', 'P03_002226_1895_XI_09N203W_32', 'P03_002226_1895_XI_09N203W_34', 'P03_002226_1895_XI_09N203W_36', 'P03_002226_1895_XI_09N203W_37', 'P03_002226_1895_XI_09N203W_44', 'P03_002226_1895_XI_09N203W_48', 'P03_002226_1895_XI_09N203W_49', 'P03_002226_1895_XI_09N203W_56', 'P03_002226_1895_XI_09N203W_57', 'P03_002226_1895_XI_09N203W_61', 'P03_002226_1895_XI_09N203W_62', 'P03_002226_1895_XI_09N203W_63', 'P03_002226_1895_XI_09N203W_65', 'P19_008344_1894_XN_09N203W_4', 'P20_008845_1894_XN_09N203W_15'].                   

Continuing, but these points will be missing from the control network
  if sys.path[0] 

Unnamed: 0,val,fid_val,no_obs,l.,s.,sig_l,sig_s,res_l,res_s,fid_x,...,known,lat_Y_North,long_X_East,ht,sig0,sig1,sig2,res0,res1,res2
10_8344_8845_4r,1,0,0,-2919.380615,1052.729004,0.000000,0.000000,0.059914,0.930311,0.0,...,0,0.159378,2.724649,-2523.828227,0.0,0.0,25.000000,18.301328,44.206259,416.201741
10_8344_8845_4r,1,0,0,-4044.697510,1008.950928,0.000000,0.000000,0.063678,0.661294,0.0,...,0,0.159378,2.724649,-2523.828227,0.0,0.0,25.000000,18.301328,44.206259,416.201741
10_8344_8845_4r,1,0,0,1700.584473,-2390.001709,0.000000,0.000000,-0.063695,-1.055619,0.0,...,0,0.159378,2.724649,-2523.828227,0.0,0.0,25.000000,18.301328,44.206259,416.201741
10_8344_8845_4r,1,0,0,2006.141113,-2234.915283,0.000000,0.000000,0.318779,-0.585138,0.0,...,0,0.159378,2.724649,-2523.828227,0.0,0.0,25.000000,18.301328,44.206259,416.201741
11_8344_8845_4r,1,0,0,370.151917,2340.653076,0.000000,0.000000,-0.239226,-1.113693,0.0,...,0,0.164905,2.721815,-2445.237027,0.0,0.0,30.000000,-22.046575,103.403228,173.210013
11_8344_8845_4r,1,0,0,-761.216064,2303.787109,0.000000,0.000000,-0.247307,-0.587299,0.0,...,0,0.164905,2.721815,-2445.237027,0.0,0.0,30.000000,-22.046575,103.403228,173.210013
11_8344_8845_4r,1,0,0,4985.437988,-1070.364990,0.000000,0.000000,0.239207,1.080801,0.0,...,0,0.164905,2.721815,-2445.237027,0.0,0.0,30.000000,-22.046575,103.403228,173.210013
11_8344_8845_4r,1,0,0,5293.700195,-993.390625,0.000000,0.000000,0.672877,0.626316,0.0,...,0,0.164905,2.721815,-2445.237027,0.0,0.0,30.000000,-22.046575,103.403228,173.210013
12_8344_8845_4r,1,0,0,236.395218,984.833252,0.000000,0.000000,0.073683,-0.237114,0.0,...,0,0.164949,2.724076,-2606.935163,0.0,0.0,100.000000,-7.549561,93.170584,180.058858
12_8344_8845_4r,1,0,0,-889.364441,966.533997,0.000000,0.000000,-0.251753,0.008170,0.0,...,0,0.164949,2.724076,-2606.935163,0.0,0.0,100.000000,-7.549561,93.170584,180.058858
