为什么 Dash 在上传文件时会出现解析错误？

Question

上传 Excel 或 CSV 导致错误。我遵循了 Dash 演示，但是一旦我尝试扩展它来做一些像绘图这样的事情，它就不起作用了。我不想只显示 table。 Dash_Table 函数已更新，因此之前使用 Dash_Table_Experiments 的示例不再有效

我整晚都在进行堆栈交换，修改我的代码并阅读其他解决方案。下面提供了完整的工作代码。我还想通过分类变量向 "filter" 数据添加一个下拉回调函数。

 import base64
 import datetime
 import io
 import plotly.graph_objs as go
 import dash
 from dash.dependencies import Input, Output, State
 import dash_core_components as dcc
 import dash_html_components as html
 import dash_table

 import pandas as pd


 external_stylesheets = ['https://codepen.io/chriddyp/pen/bWLwgP.css']

 app = dash.Dash(__name__, external_stylesheets=external_stylesheets)

 app.layout = html.Div([
  dcc.Upload(
      id='upload-data',
      children=html.Div([
        'Drag and Drop or ',
        html.A('Select Files')
    ]),
    style={
        'width': '100%',
        'height': '60px',
        'lineHeight': '60px',
        'borderWidth': '1px',
        'borderStyle': 'dashed',
        'borderRadius': '5px',
        'textAlign': 'center',
        'margin': '10px'
    },
    # Allow multiple files to be uploaded
    multiple=False
  ),
  html.Div(id='output-data-upload'),
  dcc.Graph(id='graph1')
 ])


 def parse_contents(contents, filename):
   content_type, content_string = contents.split(',')

   decoded = base64.b64decode(content_string)

   try:
       if 'csv' in filename:
         # Assume that the user uploaded a CSV file
          df = pd.read_csv(
            io.StringIO(decoded.decode('utf-8')))
       elif 'xls' in filename:
          # Assume that the user uploaded an excel file
          df = pd.read_excel(io.BytesIO(decoded))
   except Exception as e:
       print(e)
       return html.Div([
           'There was an error processing this file.'
       ])

return html.Div([
    html.H5(filename),
    # html.H6(datetime.datetime.fromtimestamp(date)),

    dash_table.DataTable(
        data=df.to_dict('records'),
        columns=[{'name': i, 'id': i} for i in df.columns]
    ),

    html.Hr(),  # horizontal line
    # For debugging, display the raw contents provided by the web browser
    html.Div('Raw Content'),
    html.Pre(contents[0:200] + '...', style={
        'whiteSpace': 'pre-wrap',
        'wordBreak': 'break-all'
    })
 ])


 @app.callback(Output('output-data-upload', 'children'),
          [Input('upload-data', 'contents')],
          [State('upload-data', 'filename')])
 def update_output(list_of_contents, list_of_names):
   if list_of_contents is not None:
       children = [
           parse_contents(c, n) for c, n in
           zip(list_of_contents, list_of_names)]
      return children

@app.callback(
   Output('graph1', 'figure'),
   [Input('upload-data', 'contents'),
   Input('upload-data', 'filename')])

def plot_graph(contents, filename):
   df = parse_contents(contents, filename)
   trace1 = go.Bar(
        x=df['Quarter'],
        y=df['Score'],
    )

layout = go.Layout(
    title='graph1'

)
fig = go.Figure(data = [trace1], layout=layout)
return fig

if __name__ == '__main__':
   app.run_server(debug=True)

我得到的错误是：回调错误更新输出数据-upload.children：ValueError：没有足够的值来解压（预期 2，得到 1）

和

AttributeError: 'NoneType' 对象没有属性 'split'

问题似乎与 python 处理解析器的方式有关：

  def parse_contents(contents, filename):
     content_type, content_string = contents.split(',')

   decoded = base64.b64decode(content_string)

但是 none 的解决方案似乎可以解决问题。

请帮忙。由于很多人都在为这个问题苦苦挣扎（看起来），如果我们能够解决它并且 post 一个功能代码 (Github?) 可以完成 Shiny 已经很容易做到的事情，那就太好了。

Answer 1

您的代码：

   children = [
       parse_contents(c, n) for c, n in
       zip(list_of_contents, list_of_names)]

然后

def parse_contents(contents, filename):
    content_type, content_string = contents.split(',')
    decoded = base64.b64decode(content_string)
    ...

这里错误发生在None中的c，那么parse_contents的contents参数是None，"None has no .split"发生错误。

如果c不是None而是只有一个词，那么contents.split()returns只有一个元素，就会出现"not enough values to unpack"错误。

我会过滤它：

pairs = zip(list_of_contents, list_of_names)
children = [parse_contents(c, n) for (c, n) in pairs if c and (len(c.split(',')) == 2)]

您也可以考虑在 parse_contents 之外进行拆分并更改其周围的代码。

我也会尝试记录内容错误的文件名，例如[n for (c, n) in pairs if not c or len(c.split(',')) != 2]).

Answer 2

解决了。在这里发帖供其他人使用：

def parse_contents(contents, filename):
if contents is not None:
    content_type, content_string = contents.split(',')

    decoded = base64.b64decode(content_string)

    try:
        if 'csv' in filename:
            # Assume that the user uploaded a CSV file
            df = pd.read_csv(
                io.StringIO(decoded.decode('utf-8')))
        elif 'xlsx' in filename:
            # Assume that the user uploaded an excel file
            df = pd.read_excel(io.BytesIO(decoded))
    except Exception as e:
        print(e)
        return html.Div([
            'There was an error processing this file.'
        ])

    return df
else:
    return [{}]


@app.callback(Output('table', 'data'),
              [Input('upload-data', 'contents'),
              Input('upload-data', 'filename')])
def update_output(contents, filename):
    if contents is not None:
        df = parse_contents(contents, filename)
        if df is not None:
            return df.to_dict('records')
        else:
            return [{}]
    else:
        return [{}]
@app.callback(
    Output('graph1', 'figure'),
    [Input('upload-data', 'contents'),
     Input('upload-data', 'filename')])

def plot_graph(contents, filename):
    df = parse_contents(contents, filename)
    trace1 = go.Bar(
            x=df['Quarter'],
            y=df['Score'],
        )

    layout = go.Layout(
        title='graph1'

)
fig = go.Figure(data = [trace1], layout=layout)
return fig

为什么 Dash 在上传文件时会出现解析错误？

Why is Dash giving a parse error when uploading files?

python

plotly

plotly-dash