Skip to content
Snippets Groups Projects
Verified Commit a7a39b33 authored by Timm Fitschen
Browse files

WIP load tsv from file

parent af7d933b
No related branches found
No related tags found
No related merge requests found
...@@ -31,27 +31,18 @@ import sys ...@@ -31,27 +31,18 @@ import sys
import pandas as pd import pandas as pd
def _parse_to_dataframe(tsv_file):
    """Attempts to create a valid dataframe from a TSV file.

    The file is read with `pandas.read_csv` using the tab character as the
    column separator; every other reader option is left at its default.

    Parameters
    ----------
    tsv_file : path to a tsv file.

    Returns
    -------
    out : The created dataframe.
    """
    # The file is handed straight to pandas; no intermediate string buffer
    # is needed because the data now comes from disk.
    dataframe = pd.read_csv(tsv_file, sep="\t")
    return dataframe
...@@ -100,15 +91,15 @@ def _parse_arguments(): ...@@ -100,15 +91,15 @@ def _parse_arguments():
tempdir = os.environ["SHARED_DIR"] tempdir = os.environ["SHARED_DIR"]
parser.add_argument('-t', '--tempdir', required=False, default=tempdir, parser.add_argument('-t', '--tempdir', required=False, default=tempdir,
help="Temporary dir for saving the result.") help="Temporary dir for saving the result.")
parser.add_argument('-u', '--urlencoded', required=True,
help="The URL encoded csv data.")
parser.add_argument('-a', '--auth-token', required=False, parser.add_argument('-a', '--auth-token', required=False,
help="An authentication token (not needed, only for compatibility).") help="An authentication token (not needed, only for compatibility).")
parser.add_argument('tsv', required=True,
help="The tsv file.")
return parser.parse_args() return parser.parse_args()
def main():
    """Convert the TSV file named on the command line and print the result.

    Parses the command-line arguments, loads the file given as `args.tsv`
    into a dataframe, hands that dataframe to `_write_xls` together with
    `args.tempdir` as the target directory, and prints the filename which
    `_write_xls` returns.
    """
    args = _parse_arguments()
    dataframe = _parse_to_dataframe(args.tsv)
    filename = _write_xls(dataframe, directory=args.tempdir)
    # The filename goes to stdout.
    print(filename)
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment