Compare commits
2 commits
79319cce2d
...
2e38ea848e
Author | SHA1 | Date | |
---|---|---|---|
2e38ea848e | |||
19ceaca42b |
3 changed files with 20 additions and 0 deletions
|
@@ -1,2 +1,3 @@
|
||||||
# copbird-sna
|
# copbird-sna
|
||||||
|
|
||||||
|
This project uses pandas. Either run `pip install pandas` to install the required package, or run these files in a conda environment.
|
||||||
|
|
11
src/create_dataset.py
Normal file
11
src/create_dataset.py
Normal file
|
@@ -0,0 +1,11 @@
|
||||||
|
import pandas as pd
|
||||||
|
|
||||||
|
tweets_path = "../raw_data/tweets.csv"
|
||||||
|
|
||||||
|
tweets = pd.read_csv(tweets_path)
|
||||||
|
|
||||||
|
# TODO extract mentions from tweets
|
||||||
|
|
||||||
|
# TODO generate co-occurrence matrix
|
||||||
|
|
||||||
|
# TODO save co-occurrence matrix
|
8
src/create_id_list.py
Normal file
8
src/create_id_list.py
Normal file
|
@@ -0,0 +1,8 @@
|
||||||
|
import pandas as pd
|
||||||
|
|
||||||
|
tweets_path = "../raw_data/tweets.csv"
|
||||||
|
|
||||||
|
tweets = pd.read_csv(tweets_path)
|
||||||
|
|
||||||
|
for id in tweets.id:
|
||||||
|
    print(id)
|
Loading…
Reference in a new issue