Taiwan Stock and OTC Lists by Categories

Ed Chao
1 min read · Aug 15, 2020
import pandas as pd
import re
def Sticker_list(category, suffix='.TW'):
    """Return the ticker symbols found on one category page as a Series.

    Parameters
    ----------
    category
        Whatever ``pd.read_html`` accepts as its first argument; it is
        passed through unchanged.
    suffix : str, optional
        Text appended to every numeric code. Defaults to ``'.TW'``.

    Returns
    -------
    pandas.Series
        One ``'<digits><suffix>'`` string for every run of digits found
        in the cell at column label 0, row label 0 of the table at
        index 5 of the parsed page.

    Raises
    ------
    IndexError
        If the page yields fewer than six tables.
    """
    tables = pd.read_html(category)
    # All codes are read from a single cell of the sixth parsed table.
    cell = tables[5][0][0]
    # Raw string: "\d" in a plain literal is an invalid escape sequence.
    codes = re.findall(r"\d+", cell)
    return pd.Series([code + suffix for code in codes])
# Build one Series of tickers per category page and lay them side by side,
# one column per category.
# NOTE(review): Slist is not defined in the visible part of this file; it
# must be an iterable of page sources created before this point.
all_S_list = pd.concat([Sticker_list(category) for category in Slist], axis=1)

# Column labels, applied positionally to the concatenated Series.
cols_name = [
    'Cement', 'Food', 'Plastic', 'Textile', 'EE', 'EA_Cable', 'Chemistry',
    'Biomedical', 'Glasses', 'Paper', 'Steel', 'Rubber', 'Cars', 'Semicon',
    'Photoelectric', 'Communicate', 'Eparts', 'Evendors', 'Itservice',
    'Eothers', 'Construction', 'Shipping', 'Sightseeing', 'Finance',
    'Vendors', 'Fuel',
]
all_S_list.columns = cols_name

# The scraped categories lack the computer category, so that column is read
# from a local workbook and appended before saving.
path = 'D:/00_我在管院研究所的日子/99_雜項/'
file1 = '電腦周邊類股.xlsx'
file2 = '台股上市各類股清單.xlsx'
computer_list = pd.read_excel(path + file1, header=None, names=['Computer'])
all_S_list = pd.concat([all_S_list, computer_list], axis=1)
all_S_list.to_excel(path + file2, index=False)

********************************************************************
import pandas as pd
import re
def OTCticker_list(category, suffix='.TW'):
    """Return the ticker symbols found on one OTC category page as a Series.

    Parameters
    ----------
    category
        Whatever ``pd.read_html`` accepts as its first argument; it is
        passed through unchanged.
    suffix : str, optional
        Text appended to every numeric code. Defaults to ``'.TW'``.
        NOTE(review): if these symbols are meant for Yahoo Finance, OTC
        listings use ``'.TWO'`` there - confirm the intended suffix.

    Returns
    -------
    pandas.Series
        One ``'<digits><suffix>'`` string for every run of digits found
        in the cell at column label 0, row label 0 of the table at
        index 5 of the parsed page.

    Raises
    ------
    IndexError
        If the page yields fewer than six tables.
    """
    tables = pd.read_html(category)
    # All codes are read from a single cell of the sixth parsed table.
    cell = tables[5][0][0]
    # Raw string: "\d" in a plain literal is an invalid escape sequence.
    codes = re.findall(r"\d+", cell)
    return pd.Series([code + suffix for code in codes])
# Scrape each OTC category page and align the resulting Series as columns.
all_OTC_list = pd.concat(list(map(OTCticker_list, OTClist)), axis=1)

# Column labels, applied positionally to the concatenated Series.
col_names = [
    'OFood', 'OPlastic', 'OTextile', 'OEE',
    'OEA', 'OChemistry', 'OBiomedical', 'OSteel',
    'ORubber', 'OSemicon', 'OComputer', 'OPhotoelectric',
    'OCommunicate', 'OEparts', 'OVendors', 'OItservice',
    'OEothers', 'OConstruction', 'OShipping', 'OSightseeing',
    'OFinance', 'OTrade', 'OFuel', 'OGame',
    'OFarm', 'OEvendors', 'OOthers', 'OCompany',
]
all_OTC_list.columns = col_names

# Save the table as an Excel workbook, without the index column.
path = 'D:/00_我在管院研究所的日子/99_雜項/'
file = '台股上櫃各類股清單.xlsx'
all_OTC_list.to_excel(f"{path}{file}", index=False)

# Bare expression: shows the frame when run as a notebook cell.
all_OTC_list

--

--

Ed Chao

Playground for an old student. Records about learning, life, and interesting stuff.