analysis for the movie graph matrix discreplancy

main
Luca Lombardo 3 years ago
parent b1b2d4ccd1
commit 329a1f84bc

@ -1,3 +1,4 @@
#!/usr/bin/env python3
import os import os
import matplotlib.pyplot as plt import matplotlib.pyplot as plt
import numpy as np import numpy as np

@ -1,11 +1,12 @@
#!/usr/bin/env python3
import os import os
import matplotlib.pyplot as plt import matplotlib.pyplot as plt
import numpy as np import numpy as np
import pandas as pd import pandas as pd
dfs = { dfs = {
i: pd.read_csv(f"top_movies_{i:02d}_c.txt", sep='\t', usecols=[1], names=["actor"]) i: pd.read_csv(f"top_movies_{i:02d}_c.txt", sep='\t', usecols=[1], names=["movie"])
for i in [5] + list(range(10, 71, 10))} for i in [500, 1000, 5000, 10000, 25000, 50000, 75000, 100000]}
sets = {i: set(df["movie"]) for i, df in dfs.items()} sets = {i: set(df["movie"]) for i, df in dfs.items()}
diff = [] diff = []

Loading…
Cancel
Save