description中fits解析——正则表达式
发布时间:2020-12-14 06:39:12 所属栏目:百科 来源:网络整理
导读:from functools import reduce import numpy as np import pandas as pd import re from bs4 import BeautifulSoup def get_description_string(description): RULES = [ # [r'^[\s\S](fitment)',""] [ r'Item[- ]?offered[\s\S]*$' , "" ],[ r'Item[- ]?Inc…
# Extract the vehicle-fitment ("fits") text from HTML product descriptions
# with a small pipeline of regular-expression rewrites, then write the result
# to a new "fit" column of an Excel sheet.
from functools import reduce
import re

import numpy as np  # noqa: F401  (unused here; kept from the original script)
import pandas as pd

try:  # Unused here; kept from the original script but made optional.
    from bs4 import BeautifulSoup  # noqa: F401
except ImportError:
    BeautifulSoup = None

# IGNORECASE: section headings appear in any capitalisation.
# MULTILINE: "^" anchors at every line start, "$" at every line end.
_FLAGS = re.IGNORECASE | re.MULTILINE

# Ordered (pattern, replacement) rules; order matters.
_RULES = tuple(
    (re.compile(pattern, _FLAGS), replacement)
    for pattern, replacement in (
        # Drop trailing sections: "[\s\S]*" is greedy and spans newlines, so
        # each rule removes everything from the keyword to the end of text.
        (r"Item[- ]?offered[\s\S]*$", ""),
        (r"Item[- ]?Included[\s\S]*$", ""),
        (r"position[\s\S]*$", ""),
        (r"Material[\s\S]*$", ""),
        (r"Item[- ]?Condition[\s\S]*$", ""),
        # Turn block-level closing tags and <br> into line breaks.
        # NOTE: "</h>" does not match numbered headings such as "</h1>";
        # those fall through to the generic tag stripper below.
        (r"</(div|h|p)>", "\n"),
        (r"<br.*?>", "\n"),
        # Strip every remaining tag.
        (r"<[^>]+?>", ""),
        # Decode the common HTML entities.  "&amp;" goes last so that text
        # such as "&amp;lt;" is unescaped exactly once (to "&lt;").
        (r"&nbsp;", " "),
        (r"&lt;", "<"),
        (r"&gt;", ">"),
        (r"&quot;", '"'),
        (r"&amp;", "&"),
        # Remove blank lines and leading indentation on every line.
        (r"^[\n\s]*", ""),
        (r"^\s+", ""),
        # Drop everything from the first line that starts with "make".
        (r"^make[\s\S]*$", ""),
    )
)


def get_description_string(description: str) -> str:
    """Return the cleaned fitment text of an HTML product description.

    The rules in ``_RULES`` are applied in order: trailing boilerplate
    sections are cut off, tags are converted to line breaks or removed,
    common HTML entities are decoded, and blank lines are collapsed.

    Args:
        description: Raw description markup.  ``None`` is treated as an
            empty string and other non-string values are converted with
            ``str()``.

    Returns:
        The cleaned text with surrounding whitespace stripped.
    """
    if description is None:
        return ""
    if not isinstance(description, str):
        description = str(description)
    cleaned = reduce(
        lambda text, rule: rule[0].sub(rule[1], text),
        _RULES,
        description,
    )
    return cleaned.strip()


def description_parse(infile: str, outfile: str) -> None:
    """Add a ``fit`` column with the cleaned description and save the sheet.

    Args:
        infile: Path of the Excel workbook to read.  It must contain the
            columns ``product_sku`` and ``description``.
        outfile: Path of the Excel workbook to write (without the index).
    """
    # read_excel takes no ``encoding`` argument; workbook text is already
    # decoded by the Excel reader.
    df = pd.read_excel(infile)
    df["description"] = df["description"].fillna("")
    df.info()  # info() prints its report itself and returns None

    fits = []
    for sku, raw in zip(df["product_sku"], df["description"]):
        fit = get_description_string(raw)
        # Progress output, as in the original script.
        print(sku)
        print(fit)
        fits.append(fit)
    df["fit"] = fits

    df.to_excel(outfile, index=False)


if __name__ == "__main__":
    description_parse(
        "ACES_fitment_description.xlsx",
        "ACES_fitment_description_parse.xlsx",
    )

# (Editor: Li Datong) Site disclaimer: all content on this site comes from the
# internet; the views expressed are those of the author only and do not
# represent the position of this site. If your rights have been infringed
# unintentionally, please contact the site administrator promptly to have the
# content removed.