# Tagify / Tags.py
# Palak Deb Patra
# Upload 4 files
# c650664 verified
# Topic labeling
# Insurance vocabulary for topic labeling; exposed through `industries`
# under the "Insurance" label. Order is preserved from the original list.
insurance_keywords = [
    # Core terms and roles
    "actuary", "claims", "coverage", "deductible", "policyholder", "premium",
    "underwriter", "risk assessment", "insurable interest", "loss ratio",
    "reinsurance", "actuarial tables", "property damage", "liability",
    # Product lines
    "flood insurance", "term life insurance", "whole life insurance",
    "health insurance", "auto insurance", "homeowners insurance",
    "marine insurance", "crop insurance", "catastrophe insurance",
    "umbrella insurance", "pet insurance", "travel insurance",
    "professional liability insurance", "disability insurance",
    "long-term care insurance", "annuity", "pension plan", "group insurance",
    # Market participants and practices
    "insurtech", "insured", "insurer", "subrogation", "adjuster",
    "third-party administrator", "excess and surplus lines", "captives",
    "workers compensation", "insurance fraud",
    # Health plan structures
    "health savings account", "health maintenance organization",
    "preferred provider organization",
]
# Finance vocabulary for topic labeling; exposed through `industries`
# under the "Finance" label. Order is preserved from the original list.
finance_keywords = [
    # Balance-sheet and investing basics
    "asset", "liability", "equity", "capital", "portfolio", "dividend",
    # Statements and analysis
    "financial statement", "balance sheet", "income statement",
    "cash flow statement", "statement of retained earnings",
    "financial ratio", "valuation",
    # Instruments, funds and markets
    "bond", "stock", "mutual fund", "exchange-traded fund", "hedge fund",
    "private equity", "venture capital", "mergers and acquisitions",
    "initial public offering", "secondary market", "primary market",
    "securities",
    # Derivatives and commodities
    "derivative", "option", "futures", "forward contract", "swaps",
    "commodities",
    # Consumer credit and cards
    "credit rating", "credit score", "credit report", "credit bureau",
    "credit history", "credit limit", "credit utilization",
    "credit counseling", "credit card", "debit card", "ATM",
    # Debt distress
    "bankruptcy", "foreclosure", "debt consolidation",
    # Taxation
    "taxes", "tax return", "tax deduction", "tax credit", "tax bracket",
    "taxable income",
]
# Banking and capital-markets vocabulary for topic labeling; exposed
# through `industries` under the "Banking" label. Original order is kept.
banking_capital_markets_keywords = [
    # Institutions and channels
    "bank", "credit union", "savings and loan association",
    "commercial bank", "investment bank", "retail bank", "wholesale bank",
    "online bank", "mobile banking",
    # Deposit products
    "checking account", "savings account", "money market account",
    "certificate of deposit",
    # Lending and cards
    "loan", "mortgage", "home equity loan", "line of credit", "credit card",
    "debit card", "ATM",
    # Payments and foreign exchange
    "automated clearing house", "wire transfer", "ACH", "SWIFT",
    "international banking", "foreign exchange", "forex",
    "currency exchange",
    # Central banking and macro policy
    "central bank", "Federal Reserve", "interest rate", "inflation",
    "deflation", "monetary policy", "fiscal policy", "quantitative easing",
    # Securities and funds
    "securities", "stock", "bond", "mutual fund", "exchange-traded fund",
    "hedge fund", "private equity", "venture capital",
    # Advisory services
    "investment management", "portfolio management", "wealth management",
    "financial planning",
]
# Healthcare and life-sciences vocabulary for topic labeling; exposed
# through `industries` under the "Health" label. Original order is kept.
healthcare_life_sciences_keywords = [
    # Industry and regulation
    "medical device", "pharmaceutical", "biotechnology", "clinical trial",
    "FDA",
    # Providers and plans
    "healthcare provider", "healthcare plan", "healthcare insurance",
    # People and places
    "patient", "doctor", "nurse", "pharmacist", "hospital", "clinic",
    # Systems and policy
    "healthcare system", "healthcare policy", "public health",
    # Health technology
    "healthcare IT", "electronic health record", "telemedicine",
    # Research
    "personalized medicine", "genomics", "proteomics", "clinical research",
    "drug development", "drug discovery",
    # Generic terms
    "medicine", "health",
]
# Legal vocabulary for topic labeling; exposed through `industries`
# under the "Law" label. Original order is kept.
law_keywords = [
    # General terms and dispute handling
    "law", "legal", "attorney", "lawyer", "litigation", "arbitration",
    "dispute resolution",
    # Practice areas
    "contract law", "intellectual property", "corporate law", "labor law",
    "tax law", "real estate law", "environmental law", "criminal law",
    "family law", "immigration law", "bankruptcy law",
]
# Sports vocabulary for topic labeling; exposed through `industries`
# under the "Sports" label. Original order is kept.
sports_keywords = [
    # Disciplines and events
    "sports", "football", "basketball", "baseball", "hockey", "soccer",
    "golf", "tennis", "olympics", "athletics",
    # Professions around sport
    "coaching", "sports management", "sports medicine", "sports psychology",
    "sports broadcasting", "sports journalism",
    # Adjacent areas
    "esports", "fitness",
]
# Media vocabulary for topic labeling; exposed through `industries`
# under the "Entertainment" label. Original order is kept.
media_keywords = [
    # Formats and channels
    "media", "entertainment", "film", "television", "radio", "music", "news",
    # Communication professions
    "journalism", "publishing", "public relations", "advertising",
    "marketing",
    # Online media
    "social media", "digital media",
    # Production and design
    "animation", "graphic design", "web design", "video production",
]
# Manufacturing vocabulary for topic labeling; exposed through `industries`
# under the "Manufacturing" label. Original order is kept.
manufacturing_keywords = [
    # Operations
    "manufacturing", "production", "assembly", "logistics", "supply chain",
    "quality control",
    # Methodologies
    "lean manufacturing", "six sigma", "industrial engineering",
    "process improvement",
    # Equipment
    "machinery", "automation",
    # Sectors
    "aerospace", "automotive", "chemicals", "construction materials",
    "consumer goods", "electronics", "semiconductors",
]
# Automobile vocabulary for topic labeling; exposed through `industries`
# under the "Automobile" label. Original order is kept.
automobile_keywords = [
    # Vehicle types
    "automotive", "cars", "trucks", "SUVs", "electric vehicles",
    "hybrid vehicles",
    # Written as a single literal; the value is the one phrase
    # "autonomous vehicles".
    "autonomous vehicles",
    # Industry and services
    "car manufacturing", "automotive design", "car dealerships",
    "auto parts", "vehicle maintenance", "car rental", "fleet management",
    "telematics",
]
# Telecom vocabulary for topic labeling; exposed through `industries`
# under the "Telecom" label. Original order is kept.
telecom_keywords = [
    # Networks and connectivity
    "telecom", "telecommunications", "wireless", "networks", "internet",
    "broadband", "fiber optics", "5G",
    # Infrastructure and transport
    "telecom infrastructure", "telecom equipment", "VoIP",
    "satellite communications",
    # Devices
    "mobile devices", "smartphones",
    # Services and governance
    "telecom services", "telecom regulation", "telecom policy",
]
# Digital/IT vocabulary for topic labeling; exposed through `industries`
# under the "Digital World" label. Entries are capitalised as written here
# (unlike the lowercase `technology_keywords`); order is kept.
digital_world_keywords = [
    # AI, data and cloud
    "Artificial intelligence", "Machine learning", "Data Science",
    "Big Data", "Cloud Computing",
    # Security
    "Cybersecurity", "Information security", "Network security",
    # Distributed ledgers
    "Blockchain", "Cryptocurrency",
    # Connected devices
    "Internet of things", "IoT",
    # Software building
    "Web development", "Mobile development", "Frontend development",
    "Backend development", "Software engineering", "Software development",
    "Programming", "Database",
    # Analytics
    "Data analytics", "Business intelligence",
    # Delivery and management practices
    "DevOps", "Agile", "Scrum", "Product management", "Project management",
    # Enterprise IT and service models
    "IT consulting", "IT service management", "ERP", "CRM", "SaaS", "PaaS",
    "IaaS", "Virtualization",
    # Immersive tech: each full term is followed by its abbreviation.
    # "AR" abbreviates "Augmented reality".
    "Augmented reality", "AR", "Virtual reality", "VR", "Gaming",
    # Online commerce and marketing
    "E-commerce", "Digital marketing", "SEO", "SEM", "Content marketing",
    "Social media marketing",
    # Design
    "User experience", "UX design", "UI design",
    # Cloud architecture
    "Cloud-native", "Microservices", "Serverless", "Containerization",
]
# Technology vocabulary for topic labeling; exposed through `industries`
# under the "Technology" label. Original order is kept.
technology_keywords = [
    # General terms
    "technology", "innovation", "research", "development", "software",
    "hardware",
    # AI, data, cloud and security
    "artificial intelligence", "machine learning", "data science",
    "big data", "cloud computing", "cybersecurity", "blockchain",
    # Connected devices
    "internet of things", "IoT",
    # Software building
    "web development", "mobile development",
    # Analytics
    "data analytics", "business intelligence",
    # Immersive tech (term followed by its abbreviation)
    "virtual reality", "VR", "augmented reality", "AR",
    # Consumer-facing digital
    "gaming", "e-commerce", "digital marketing",
]
# Healthcare vocabulary for topic labeling; exposed through `industries`
# under the "Healthcare" label. Original order is kept.
healthcare_keywords = [
    # Generic terms
    "healthcare", "medical", "medicine",
    # Care settings and staff
    "hospital", "clinic", "doctor", "nurse", "pharmacist", "patient care",
    # Systems and policy
    "healthcare system", "public health", "healthcare policy",
    # Health technology
    "telemedicine", "electronic health records",
    # Products and research
    "medical devices", "clinical trials", "pharmaceuticals",
]
# Education vocabulary for topic labeling; exposed through `industries`
# under the "Education" label. Original order is kept.
education_keywords = [
    # Activities
    "education", "teaching", "learning",
    # Institutions and people
    "school", "university", "college", "student", "teacher", "curriculum",
    # Online and technology-assisted learning
    "online education", "e-learning", "distance learning",
    "educational technology", "learning management system",
    "educational resources",
]
# Energy vocabulary for topic labeling; exposed through `industries`
# under the "Energy" label. Original order is kept.
energy_keywords = [
    # Low-carbon sources
    "energy", "renewable energy", "solar energy", "wind energy",
    "hydropower", "nuclear energy",
    # Fossil sources
    "fossil fuels", "oil", "natural gas", "coal",
    # Grid and efficiency
    "electricity", "energy efficiency", "smart grid", "sustainability",
]
# Retail vocabulary for topic labeling; exposed through `industries`
# under the "Retail" label. Original order is kept.
retail_keywords = [
    # Channels
    "retail", "shopping", "e-commerce", "online shopping",
    "brick and mortar", "store",
    # Shoppers
    "customer", "consumer behavior",
    # Operations
    "inventory management", "supply chain", "logistics", "retail analytics",
]
# Hospitality vocabulary for topic labeling; exposed through `industries`
# under the "Hospitality" label. Original order is kept.
hospitality_keywords = [
    "hospitality", "hotel", "restaurant", "tourism", "travel",
    "hospitality management", "customer service", "guest experience",
    "hospitality industry", "event management",
]
# Real-estate vocabulary for topic labeling; exposed through `industries`
# under the "Real Estate" label. Original order is kept.
real_estate_keywords = [
    # Property types
    "real estate", "property", "home", "house", "apartment",
    "commercial property",
    # Transactions and finance
    "real estate agent", "real estate market", "mortgage",
    "real estate investment",
    # Management and rentals
    "property management", "housing market", "rental properties",
]
# Agriculture vocabulary for topic labeling; exposed through `industries`
# under the "Agriculture" label. Original order is kept.
agriculture_keywords = [
    "agriculture", "farming", "crop", "livestock", "agribusiness",
    "sustainable agriculture", "precision agriculture",
    "agricultural technology", "food security",
]
# Environment vocabulary for topic labeling; exposed through `industries`
# under the "Environment" label. Original order is kept.
environment_keywords = [
    "environment", "sustainability", "conservation", "climate change",
    "renewable resources", "ecology", "green energy", "eco-friendly",
    "environmental policy", "carbon footprint",
]
# Art and culture vocabulary for topic labeling; exposed through
# `industries` under the "Art & Culture" label. Original order is kept.
art_culture_keywords = [
    "art", "culture", "creativity", "music", "film", "literature",
    "painting", "sculpture", "performing arts", "cultural heritage",
    "artistic expression",
]
# Travel vocabulary for topic labeling; exposed through `industries`
# under the "Travel" label. Original order is kept.
travel_keywords = [
    "travel", "tourism", "vacation", "holiday", "adventure",
    "travel agency", "travel planning", "travel destination",
    "sightseeing", "cruise",
]
# Fashion vocabulary for topic labeling; exposed through `industries`
# under the "Fashion" label. Original order is kept.
fashion_keywords = [
    "fashion", "clothing", "apparel", "style", "designer",
    "fashion trends", "fashion industry", "fashion show",
    "fashion accessories", "fashion retail",
]
# Architecture vocabulary for topic labeling; exposed through `industries`
# under the "Architecture" label. Original order is kept.
architecture_keywords = [
    "architecture", "building", "design", "construction", "architect",
    "urban planning", "architecture styles", "sustainable architecture",
    "interior design", "landscape architecture",
]
# Aviation vocabulary for topic labeling; exposed through `industries`
# under the "Aviation" label. Original order is kept.
aviation_keywords = [
    "aviation", "aircraft", "airline", "flight", "pilot",
    "aviation safety", "aerospace", "aviation technology",
    "air traffic control", "airport",
]
# Gaming vocabulary for topic labeling; exposed through `industries`
# under the "Gaming" label. Original order is kept.
gaming_keywords = [
    "gaming", "video games", "gamer", "gaming industry", "game development",
    "esports", "gaming community", "gaming platform", "online gaming",
    "gaming tournaments",
]
# Food and beverage vocabulary for topic labeling; exposed through
# `industries` under the "Food & Beverage" label. Original order is kept.
food_beverage_keywords = [
    "food", "beverage", "cuisine", "restaurant", "chef", "culinary arts",
    "food industry", "food culture", "food technology",
    "food sustainability",
]
# Fitness vocabulary for topic labeling; exposed through `industries`
# under the "Fitness" label. Original order is kept.
fitness_keywords = [
    "fitness", "exercise", "workout", "gym", "fitness training",
    "fitness equipment", "health and fitness", "personal training",
    "fitness classes", "wellness",
]
# Pharmaceutical vocabulary for topic labeling; exposed through
# `industries` under the "Pharmaceuticals" label. Original order is kept.
pharmaceuticals_keywords = [
    "pharmaceuticals", "drugs", "medicine", "pharmaceutical industry",
    "drug development", "clinical trials", "pharmaceutical research",
    "pharmacy", "pharmacology", "pharmaceutical manufacturing",
]
# Music vocabulary for topic labeling; exposed through `industries`
# under the "Music" label. Original order is kept.
music_keywords = [
    "music", "musical", "artist", "concert", "music production",
    "music industry", "music performance", "music streaming",
    "music festival", "music education",
]
# Maps each topic label to the module-level keyword list that describes it.
# Built from (label, keyword list) pairs; insertion order matches the pairs.
# NOTE(review): "Health" and "Healthcare" are separate labels whose keyword
# lists share several entries, and "Entertainment" is backed by
# `media_keywords` - confirm both are intended.
industries = dict(
    (
        ("Insurance", insurance_keywords),
        ("Finance", finance_keywords),
        ("Banking", banking_capital_markets_keywords),
        ("Health", healthcare_life_sciences_keywords),
        ("Law", law_keywords),
        ("Sports", sports_keywords),
        ("Entertainment", media_keywords),
        ("Manufacturing", manufacturing_keywords),
        ("Automobile", automobile_keywords),
        ("Telecom", telecom_keywords),
        ("Digital World", digital_world_keywords),
        ("Technology", technology_keywords),
        ("Healthcare", healthcare_keywords),
        ("Education", education_keywords),
        ("Energy", energy_keywords),
        ("Retail", retail_keywords),
        ("Hospitality", hospitality_keywords),
        ("Real Estate", real_estate_keywords),
        ("Agriculture", agriculture_keywords),
        ("Environment", environment_keywords),
        ("Art & Culture", art_culture_keywords),
        ("Travel", travel_keywords),
        ("Fashion", fashion_keywords),
        ("Architecture", architecture_keywords),
        ("Aviation", aviation_keywords),
        ("Gaming", gaming_keywords),
        ("Food & Beverage", food_beverage_keywords),
        ("Fitness", fitness_keywords),
        ("Pharmaceuticals", pharmaceuticals_keywords),
        ("Music", music_keywords),
    )
)