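# Regular expressions (正则): split a mixed string into its digits, its letters, and the remaining text.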
import re

import pandas as pd
# Compiled once at import time so repeated calls (e.g. via Series.apply)
# do not have to look the pattern up again.
_NUMERIC_PATTERN = re.compile(r'[0-9]')


def get_number(input):
    """Return all ASCII digits found in *input*, concatenated in order.

    Args:
        input: The string to scan. (The name shadows the builtin ``input``;
            it is kept so existing keyword callers continue to work.)

    Returns:
        A string made of every ``0``-``9`` character in *input*, in their
        original order. Empty string if there are none. Digits that are
        separated by other characters are joined together, e.g.
        ``"a1b2"`` gives ``"12"``.
    """
    return ''.join(_NUMERIC_PATTERN.findall(input))
# Compiled once at import time so repeated calls (e.g. via Series.apply)
# do not have to look the pattern up again.
_LETTER_PATTERN = re.compile(r'[a-zA-Z]')


def get_letter(input):
    """Return all ASCII letters found in *input*, concatenated in order.

    Args:
        input: The string to scan. (The name shadows the builtin ``input``;
            it is kept so existing keyword callers continue to work.)

    Returns:
        A string made of every ``a``-``z`` / ``A``-``Z`` character in
        *input*, in their original order. Empty string if there are none.
    """
    return ''.join(_LETTER_PATTERN.findall(input))
# Compiled once at import time so repeated calls (e.g. via Series.apply)
# do not have to look the pattern up again.
_ASCII_ALNUM_PATTERN = re.compile(r'[0-9a-zA-Z]')


def get_chinese(input):
    """Return *input* with every ASCII digit and ASCII letter removed.

    Despite the name, this does not select Chinese characters explicitly:
    it deletes ``0``-``9``, ``a``-``z`` and ``A``-``Z`` and returns whatever
    is left, so punctuation, whitespace and any other non-ASCII text are
    preserved as well.

    Args:
        input: The string to clean. (The name shadows the builtin ``input``;
            it is kept so existing keyword callers continue to work.)

    Returns:
        The remaining characters of *input*, in their original order.
    """
    return _ASCII_ALNUM_PATTERN.sub('', input)
# Example contents of df['name'] before processing:
#   断肠草30g
#   狗尾吧草110kg
#   熊胆2g
# Split each raw value in df['name'] into three columns.
# 'weight' and 'unit' are derived first because the last assignment
# overwrites 'name' with the text that is left after removing the ASCII
# digits and letters.
# Note: 'weight' holds digit strings (get_number returns str), not numbers.
df['weight'] = df['name'].apply(get_number)  # was get_numeric, which is not defined
df['unit'] = df['name'].apply(get_letter)
df['name'] = df['name'].apply(get_chinese)
print(df)  # that is all that is needed