在python pandas中搜索整行Dataframe的多个字符串值

相关文章推荐

睿智的跑步鞋 · nginx-重写和重定向关系与配置_ngin ...· 3 天前 ·

玩手机的数据线 · C++类模板声明与定义为何不能分开 - ...· 1 年前 ·

玉树临风的滑板 · 如何让这张图片在IFrame中打开？· 1 年前 ·

酒量大的蛋挞 · c# - Is it really ...· 1 年前 ·

害羞的篮球 · 谷歌将对Android广告跟踪进行更改意味着 ...· 1 年前 ·

import pandas as pd
# Sample data: four early Apple computers with their launch and
# discontinuation years.
data = dict(
    model=['Lisa', 'Lisa 2', 'Macintosh 128K', 'Macintosh 512K'],
    launched=[1983, 1984, 1984, 1984],
    discontinued=[1986, 1985, 1984, 1986],
)
# Pass the column order explicitly so the frame is laid out as
# model / launched / discontinued.
df = pd.DataFrame(data, columns=list(data))
# Bare expression: echoes the frame when run in an interactive session.
df

# Substrings to look for.
l = ['int', 'tos', '198']

# Joining the terms with '|' produces one regex alternation, so a single
# str.contains call reports whether the 'model' value matches any of them.
df['model'].str.contains('|'.join(l))
0    False
1    False
2     True
3     True

from functools import reduce

# The pattern `m` was never defined in this snippet, so it raised NameError.
# The result printed below (row 0 False, rows 1-3 True) corresponds to the
# terms 'int', 'tos' and '1985', so the alternation is built from those.
m = '|'.join(['int', 'tos', '1985'])

# Build one boolean mask per column (cast to str so numeric columns can be
# searched too) and OR them together: a row is True if any column matches.
res = reduce(lambda a, b: a | b, [df[col].astype(str).str.contains(m) for col in df.columns])
0    False
1     True
2     True
3     True

# Store the row-wise match mask `res` as integers in a new column.
df['new_col'] = res.astype(int)
     new_col
0    0
1    1
2    1
3    1

# Substrings to look for in the model name.
match = ['int', 'tos', '198']

# Flag each row with 1 when its 'model' string contains at least one of the
# substrings, otherwise 0.
df['isContained'] = df['model'].apply(
    lambda name: int(any(term in name for term in match))
)

            model  launched  discontinued  isContained
0            Lisa      1983          1986            0
1          Lisa 2      1984          1985            0
2  Macintosh 128K      1984          1984            1
3  Macintosh 512K      1984          1986            1

match = ['int', 'tos', '1985']


def string_finder(row, words):
    """Return True if any of *words* occurs in any field of *row*.

    Each field is tested with ``word in field``, so for string fields this
    is a substring match. Returns False when *row* or *words* is empty.
    """
    for field in row:
        for word in words:
            if word in field:
                return True
    return False
# Cast every cell to str first: string_finder tests `word in field`, which
# needs string fields to work on the numeric year columns. axis=1 hands the
# function one row at a time.
df['isContained'] = df.astype(str).apply(
    string_finder,
    axis=1,
    words=match,
)
print(df)
            model  launched  discontinued  isContained
0            Lisa      1983          1986        False
1          Lisa 2      1984          1985         True
2  Macintosh 128K      1984          1984         True
3  Macintosh 512K      1984          1986         True

def check_all_for(column_name, search_terms):
    """Flag each row of the module-level ``df`` that contains any search term.

    Every cell is converted to a lower-case string and tested for each term
    as a substring; terms are lower-cased too, so matching is
    case-insensitive. The result is written to ``df[column_name]`` as 1
    (at least one cell matched) or 0 (no match).

    Args:
        column_name: Name of the flag column to create or overwrite.
        search_terms: Iterable of substrings to look for.

    Returns:
        None. ``df`` is modified in place.
    """
    # Lower-case the terms once; cells are lower-cased below, so a term
    # containing upper-case letters could otherwise never match.
    terms = [str(term).lower() for term in search_terms]
    # Leave the flag column itself out of the search so that flags from a
    # previous call are never matched against.
    searched = [col for col in df.columns if col != column_name]

    flags = []
    # iterrows() yields (index, row) pairs, and the row is a copy, so the
    # flags are collected here and assigned to the frame in one step.
    for _, row in df[searched].iterrows():
        cells = [str(cell).lower() for cell in row]
        hit = any(term in cell for cell in cells for term in terms)
        flags.append(int(hit))
    df[column_name] = flags

match = ['int', 'tos', '1984']


def string_finder(row, words):
    """Tell whether at least one of *words* is contained in some field of *row*.

    Containment is checked with ``word in field``; an empty *row* or an
    empty *words* yields False.
    """
    return any(
        any(word in field for word in words)
        for field in row
    )
def AssessAllString(row, words):
    """Return True only if every word in *words* is found somewhere in *row*.

    Each word is checked on its own through ``string_finder``, so different
    words may be found in different fields. An empty *words* yields True.
    """
    # Evaluate every word up front (a list, not a generator) so that all
    # words are checked regardless of earlier results.
    verdicts = [string_finder(row, [word]) for word in words]
    return all(verdicts)
# Work on a string-cast copy of the frame so substring tests also apply to
# the numeric year columns; axis=1 evaluates AssessAllString once per row.
df['isContained'] = df.astype(str).apply(
    AssessAllString,
    axis=1,
    words=match,
)
print(df)
            model  launched  discontinued  isContained
0  Lisa            1983      1986          False      
1  Lisa 2          1984      1985          False      
2  Macintosh 128K  1984      1984          True       
3  Macintosh 512K  1984      1986          True

# Both terms must be present somewhere in the row for it to be flagged.
match = ['isa', '1984']
df['isContained'] = df.astype(str).apply(
    AssessAllString,
    axis=1,
    words=match,
)

在python pandas中搜索整行Dataframe的多个字符串值 内容来源于 Stack Overflow，遵循 CC BY-SA 4.0 许可协议进行翻译与使用。腾讯云小微IT领域专用引擎提供翻译支持

5 个回答