
我在一个文件夹中有一个 zip 文件 A001-C-002.zip 和一个 .xlsx 文件 HUBMAP B004 codex antibodies metadata.xlsx。首先，我想读取 xlsx 文件并将其转换为数据帧（DataFrame）。接下来，我要处理 zip 文件中的所有文件。

from pathlib import Path
import pandas as pd
import zipfile
import os
import sys
path = "./../../"

# Load the antibody metadata workbook into a DataFrame.
#
# An .xlsx workbook is a binary file, so it must not be opened in text mode
# ('r'): handing such a handle to pandas is what raised the
# UnicodeDecodeError. Passing the file name lets pandas open the workbook in
# binary mode itself.
#
# The workbook is also read exactly once; it does not depend on the other
# entries of the working directory, so there is no loop over os.listdir().
ab_df = pd.read_excel("HUBMAP B004 codex antibodies metadata.xlsx")
print(f"Antibody metadata column names:\n {ab_df.columns.values}")

# Patient A001
# NOTE(review): `path` is assigned a plain str earlier in this script, so
# `path / ""` raises TypeError; the archive file name is also left empty here.
with zipfile.ZipFile(path / "") as z:
for filename in z.namelist():
# NOTE(review): os.path.isdir() inspects the local filesystem, whereas the
# names returned by namelist() are paths inside the archive.
if not os.path.isdir(filename):
# NOTE(review): the statement below is incomplete in the original snippet.
for line in


> --------------------------------------------------------------------------- UnicodeDecodeError                        Traceback (most recent call
> last) /tmp/ipykernel_3212/ in <module>
>       2     with open(os.path.join(os.getcwd(), filename), 'r') as f:
>       3         with open("HUBMAP B004 codex antibodies metadata.xlsx", 'r') as ab:
> ----> 4             ab_df = pd.read_excel(ab)
>       5             print(f"Antibody metadata column names:n {ab_df.columns.values}")
>       6 
> UnicodeDecodeError: 'utf-8' codec can't decode byte 0x9a in position
> 15: invalid start byte




# Hand pandas the workbook's file name rather than an already-open text-mode
# handle; pandas then opens the file itself.
df = pd.read_excel(io="HUBMAP B004 codex antibodies metadata.xlsx")
