I need your help: can anyone tell me what this part of the code is doing?
# line[-6:] is the last six characters of the line; a line whose last six
# characters are exactly '[edit]' is treated as a state header.
if line[-6:] == '[edit]':
# line[:-6] is everything except those last six characters, i.e. the text
# that precedes '[edit]', which is kept as the state name.
state = line[:-6]
and
# line.index('(') is the position of the first '(' in the line. Subtracting 1
# makes the slice stop one character earlier, so the character just before the
# '(' (expected to be a space) is dropped too; town is the text before " (".
town = line[:(line.index('(')-1)]
The whole code is:
def get_list_of_university_towns():
    '''Returns a DataFrame of towns and the states they are in from the
    university_towns.txt list. The format of the DataFrame should be:
    DataFrame( [ ["Michigan", "Ann Arbor"], ["Michigan", "Yipsilanti"] ],
    columns=["State", "RegionName"] )

    The following cleaning is done:
    1. For "State", the trailing "[edit]" marker is removed.
    2. For "RegionName", when applicable, every character from the first
       "(" to the end is removed, together with the whitespace before it.
    3. Trailing whitespace (including the line terminator) is stripped from
       every line, and blank lines are skipped.

    The file is read from the current working directory. Any town line that
    appears before the first state header is recorded with a State of None.
    '''
    edit_marker = '[edit]'
    state = None  # no state header seen yet
    state_town = []
    with open('university_towns.txt') as file:
        for raw_line in file:
            # rstrip() instead of slicing off the last character: the final
            # line of the file may not end with a newline at all.
            line = raw_line.rstrip()
            if not line:
                continue  # a blank line is neither a state nor a town
            if line.endswith(edit_marker):
                # State header: remember it for the town lines that follow.
                state = line[:-len(edit_marker)]
            else:
                # Keep only the text before the first "(". When the line has
                # no "(", partition() returns the whole line unchanged.
                town = line.partition('(')[0].rstrip()
                state_town.append([state, town])
    return pd.DataFrame(state_town, columns=['State', 'RegionName'])
# Call the function; the returned DataFrame is not assigned to a name here.
# NOTE(review): presumably run as the last line of a notebook cell so the
# result is displayed — confirm.
get_list_of_university_towns()