|
|
@ -1,11 +1,12 @@
|
|
|
|
|
|
|
|
#!/usr/bin/env python3
|
|
|
|
import os
|
|
|
|
import os
|
|
|
|
import matplotlib.pyplot as plt
|
|
|
|
import matplotlib.pyplot as plt
|
|
|
|
import numpy as np
|
|
|
|
import numpy as np
|
|
|
|
import pandas as pd
|
|
|
|
import pandas as pd
|
|
|
|
|
|
|
|
|
|
|
|
dfs = {
|
|
|
|
dfs = {
|
|
|
|
i: pd.read_csv(f"top_movies_{i:02d}_c.txt", sep='\t', usecols=[1], names=["actor"])
|
|
|
|
i: pd.read_csv(f"top_movies_{i:02d}_c.txt", sep='\t', usecols=[1], names=["movie"])
|
|
|
|
for i in [5] + list(range(10, 71, 10))}
|
|
|
|
for i in [500, 1000, 5000, 10000, 25000, 50000, 75000, 100000]}
|
|
|
|
sets = {i: set(df["movie"]) for i, df in dfs.items()}
|
|
|
|
sets = {i: set(df["movie"]) for i, df in dfs.items()}
|
|
|
|
|
|
|
|
|
|
|
|
diff = []
|
|
|
|
diff = []
|
|
|
|