Homework 5 - The eternal significance of publications and citations!¶
Citation networks, intricately woven through references in scholarly papers, play a pivotal role in mapping the evolution of knowledge in academic research. Analyzing these networks is essential for identifying influential works, tracking idea development, and gauging the impact of research. Leveraging graph analysis enhances our ability to uncover hidden patterns, predict emerging trends, and comprehend the intricate relationships within these networks.
This time, you and your team have decided to dive deep into the citation realm. Now, you will deal with graphs to determine relevant characteristics and highlights from the relations among those publications.
Let's get hands-on!
In this homework, you will explore the paper citation universe, analyzing the relations among multiple academic publications!
- Backend: where you need to develop efficient algorithms that define the functionalities of the system
- Frontend: where you provide visualization for queries entered by the user
IMPORTANT: To deal with functionalities 1 and 2 and visualization of graphs, you can freely use libraries such as networkx
or any other tool you choose. Still, the algorithms for functionalities 3, 4, and 5 must be implemented by yourself, using proper data structures and without any library that computes the algorithm steps for you.
1. Data¶
In this homework, you will work on a dataset that contains information about a group of papers and their citation relationships. You can find and download the dataset here
Graphs setup¶
Based on the available data, you will create two graphs to model our relationships as follows:
Citation graph: This graph should represent the papers' citation relationships. We want this graph to be unweighted and directed: an edge represents a citation given from one paper to another. For example, if paper A has cited paper B, we should expect an edge from node A to B.
Collaboration graph: This graph should represent the collaborations of the paper's authors. This graph should be weighted and undirected. Consider an appropriate weighting scheme for your edges to make your graph weighted.
Data pre-processing¶
The dataset is quite large and may not fit in your memory when you try constructing your graph. So, what is the solution? You should focus your investigation on a subgraph. You can work on the most connected component in the graph. However, you must first construct and analyze the connections to identify the connected components.
As a result, you will attempt to approximate that most connected component by performing the following steps:
Identify the top 10,000 papers with the highest number of citations.
Then the nodes of your graphs would be as follows:
Citation graph: you can consider each of the papers as your nodes
Collaboration graph: the authors of these papers would be your nodes
For the edges of the two graphs, you would have the following cases:
Citation graph: only consider the citation relationship between these 10,000 papers and ignore the rest.
Collaboration graph: only consider the collaborations between the authors of these 10,000 papers and ignore the rest.
Here are several helpful packages to load and set up
import numpy as np
import pandas as pd
import ijson
import time
import csv
from decimal import Decimal
import matplotlib as mpl
import matplotlib.pyplot as plt
import networkx as nx
from itables import init_notebook_mode
from libs.backend import * # Custom backend functionalities
from libs.frontend import * # Custom frontend to display backend functionalities
import ipywidgets as widgets
import warnings
# Make sure that plots are in-line
%matplotlib inline
# Make the tables interactive
init_notebook_mode(all_interactive=True)
# Set plot grid parameter
mpl.rcParams['grid.linestyle'] = "-"
# Suppress DeprecationWarnings from IpyWidgets
warnings.filterwarnings('ignore')
Converting JSON to CSV (adapted from https://www.kaggle.com/code/shreyasbhatk/csv-conversion-all-fields)
start = time.process_time()
PAPER = []
Author = []
count = 0
with open('dblp.v12.json', "rb") as f, open("output.csv", "w", newline="") as csvfile:
fieldnames = ['id', 'title', 'year', 'author_name', 'author_org', 'author_id', 'n_citation', 'doc_type',
'reference_count', 'references', 'venue_id', 'venue_name', 'venue_type', 'doi', 'keyword','volume','issue','publisher',
'weight', 'indexed_keyword', 'inverted_index']
writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
writer.writeheader()
    for element in ijson.items(f, "item"):
paper = {}
paper['id'] = element['id']
paper['title'] = element['title']
year = element.get('year')
if year:
paper['year'] = year
else:
paper['year'] = np.nan
author = element.get('authors')
if author:
Author = element['authors']
author_name = []
author_org = []
author_id = []
for i in Author:
if 'name' in i and 'id' in i and 'org' in i:
author_name.append(str(i['name'])) # Convert to string
author_id.append(str(i['id']))
author_org.append(str(i['org']))
else:
author_name.append(str(np.nan)) # Convert to string
author_id.append(str(np.nan))
author_org.append(str(np.nan))
paper['author_name'] = ';'.join(author_name)
paper['author_org'] = ';'.join(author_org)
paper['author_id'] = ';'.join(author_id)
n_citation = element.get('n_citation')
if n_citation:
paper['n_citation'] = n_citation
else:
paper['n_citation'] = np.nan
doc_type = element.get('doc_type')
if doc_type:
paper['doc_type'] = doc_type
else:
paper['doc_type'] = np.nan
references = element.get('references')
if references:
paper['reference_count'] = len(references)
paper['references'] = ';'.join(str(int(r)) for r in references)
        else:
            paper['reference_count'] = 0  # no references listed for this paper
            paper['references'] = np.nan
venue = element.get('venue')
if venue:
if 'id' in venue and 'raw' in venue and 'type' in venue:
paper['venue_id'] = str(venue['id'])
paper['venue_name'] = venue['raw']
paper['venue_type'] = venue['type']
else:
paper['venue_id'] = np.nan
paper['venue_name'] = np.nan
paper['venue_type'] = np.nan
else:
paper['venue_id'] = np.nan
paper['venue_name'] = np.nan
paper['venue_type'] = np.nan
doi = element.get('doi')
if doi:
paper['doi'] = f"https://doi.org/{doi}"
else:
paper['doi'] = np.nan
fos = element.get('fos')
if fos:
fosunparsed = element['fos']
keyword = []
weight = []
for i in fosunparsed:
if isinstance(i['w'], (int, float, Decimal)):
keyword.append(str(i['name'])) # Convert to string
weight.append(str(i['w']))
else:
keyword.append(str(np.nan)) # Convert to string
weight.append(str(np.nan))
else:
keyword = []
weight = []
paper['keyword'] = ';'.join(keyword)
paper['weight'] = ';'.join(weight)
indexed_abstract = element.get('indexed_abstract')
if indexed_abstract:
indexed_abstracts = indexed_abstract.get('InvertedIndex')
inverted_vector = []
keywords = []
for i in indexed_abstracts:
if i:
keywords.append(str(i)) # Convert to string
inverted_vector.append(str(indexed_abstracts[i])) # Convert to string
else:
keywords = []
inverted_vector = []
paper['indexed_keyword'] = ';'.join(keywords)
paper['inverted_index'] = ';'.join(inverted_vector)
publisher= element.get('publisher')
if publisher:
paper['publisher']=publisher
else:
paper['publisher']=np.nan
volume = element.get('volume')
if volume:
paper['volume']=volume
else:
paper['volume']=np.nan
issue = element.get('issue')
if issue:
paper['issue']=issue
else:
paper['issue']=np.nan
count += 1
writer.writerow(paper)
if count % 4800 == 0:
print(f"{count}:{round((time.process_time() - start), 2)}s ", end="")
Data Pre-processing Algorithm¶
Step 1: Load Data and Identify Top 10,000 Papers¶
- Load the dataset into a Pandas DataFrame.
- Sort the DataFrame by the `n_citation` column in descending order to get the papers with the highest number of citations.
- Slice the top 10,000 records to work with.
Step 2: Construct Nodes for Both Graphs¶
- For the Citation Graph:
  - Extract the `id` field of the top 10,000 papers to use as nodes.
- For the Collaboration Graph:
  - Extract the `author_id` fields of the top 10,000 papers, parse the individual author IDs, and use them as nodes.
Step 3: Construct Edges for Both Graphs¶
- For the Citation Graph:
  - For each of the top 10,000 papers, parse its `references` field to find other papers it cites.
  - Filter those references to only include papers within the top 10,000.
  - Add directed edges from the citing paper to the cited papers.
- For the Collaboration Graph:
  - For each paper, parse the `author_id` field to find all pairs of authors that have collaborated.
  - Add undirected edges between these authors.
  - The weighting scheme could be the number of papers co-authored by the pair, meaning each additional paper they co-author together increases the weight of the edge by one.
Approximating the Most Connected Component¶
To identify the most connected component, we would analyze the constructed graphs:
- Use NetworkX to find connected components in the collaboration graph (since it's undirected) and weakly connected components in the citation graph (since it's directed).
- Determine the size of each component.
- Identify the largest component.
Code Implementation:¶
# Load data into a Pandas DataFrame
df = pd.read_csv('output.csv')
# Sort by number of citations and get the top 10,000 papers
top_papers = df.sort_values('n_citation', ascending=False).head(10000)
# Citation Graph Nodes
citation_nodes = top_papers['id'].tolist()
# Collaboration Graph Nodes
collaboration_nodes = set()
# Before applying the lambda, ensure NaN values are handled, e.g., by converting to a string
top_papers['author_id'] = top_papers['author_id'].fillna('')
# Now applying the lambda function
top_papers['author_id'].str.split(';').apply(lambda x: collaboration_nodes.update(x) if isinstance(x, list) else None)
# Empty and NaN ids are dropped
collaboration_nodes.discard('')
collaboration_nodes.discard('nan')
# Create graphs
citation_graph = nx.DiGraph()
collaboration_graph = nx.Graph()
# Add nodes to graphs
citation_graph.add_nodes_from(citation_nodes)
collaboration_graph.add_nodes_from(collaboration_nodes)
# Create a dictionary with authors ids as keys and authors names as values
authors_names = dict()
top_papers.apply(lambda row: authors_names.update(dict(zip(row['author_id'].split(';'),row['author_name'].split(';')))) if not(pd.isna(row['author_name'])) else None, axis = 1)
# NaN name is dropped (if present)
authors_names.pop('nan', None)
# Add papers titles and authors names to node attributes
nx.set_node_attributes(citation_graph, dict(zip(top_papers.id, top_papers.title)), name = 'title')
nx.set_node_attributes(collaboration_graph, authors_names, name = 'author_name')
# Add edges to Citation Graph
for _, row in top_papers.iterrows():
if pd.notna(row['references']):
cited_papers = [int(x) for x in row['references'].split(';') if x.isdigit()]
for cited in cited_papers:
if cited in citation_nodes:
citation_graph.add_edge(row['id'], cited)
# Add edges to Collaboration Graph with a simple weighting scheme
edges_labels = dict()
for _, row in top_papers.iterrows():
authors = str(row['author_id']).split(';') if pd.notnull(row['author_id']) else []
authors = [obj for obj in authors if obj != 'nan']
for i, author_i in enumerate(authors):
for author_j in authors[i+1:]:
if author_i and author_j: # Ensure author_i and author_j are not empty strings
if collaboration_graph.has_edge(author_i, author_j):
collaboration_graph[author_i][author_j]['weight'] += 1
else:
collaboration_graph.add_edge(author_i, author_j, weight=1)
edges_labels.update({(author_i,author_j):row['title']})
# Associate to each edge of the collaboration graph the name of the correspondent paper
nx.set_edge_attributes(collaboration_graph, edges_labels, name = 'paper')
# Identify the largest connected component in the collaboration graph
largest_collaboration_cc = max(nx.connected_components(collaboration_graph), key=len)
subgraph_collaboration_graph = collaboration_graph.subgraph(largest_collaboration_cc)
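# For the directed citation graph, the analogous step uses *weakly* connected components
# (connectivity computed while ignoring edge direction). Illustrative sketch only:
largest_citation_wcc = max(nx.weakly_connected_components(citation_graph), key=len)
subgraph_citation_graph = citation_graph.subgraph(largest_citation_wcc)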
# Visualizing the citation graph
plt.figure(figsize=(12, 8))
pos = nx.spring_layout(citation_graph)
nx.draw(citation_graph, pos, node_size=10, arrows=True, edge_color='red', with_labels=False)
plt.title("Citation Graph")
plt.show()
# Visualizing the collaboration graph
plt.figure(figsize=(12, 8))
pos = nx.spring_layout(collaboration_graph)
nx.draw(collaboration_graph, pos, node_size=10, edge_color='gray', with_labels=False)
plt.title("Collaboration Graph")
plt.show()
Visualizing the Largest Connected Component in the Collaboration Graph
# Visualizing the Largest Connected Component in the Collaboration Graph
plt.figure(figsize=(12, 8))
pos = nx.spring_layout(subgraph_collaboration_graph)
nx.draw(subgraph_collaboration_graph, pos, node_size=10, edge_color='gray', with_labels=False)
plt.title("Largest Connected Component in the Collaboration Graph")
plt.show()
To save or export the graphs as GraphML
# Assuming citation_graph and collaboration_graph are already created NetworkX graph objects
nx.write_graphml(citation_graph, "citation_graph.graphml")
nx.write_graphml(collaboration_graph, "collaboration_graph.graphml")
nx.write_graphml(subgraph_collaboration_graph, "subgraph_collaboration_graph.graphml")
To read or import the saved graphs from GraphML
citation_path = 'citation_graph.graphml'
collaboration_path = 'collaboration_graph.graphml'
subcollaboration_path = 'subgraph_collaboration_graph.graphml'
# Load the citation graph from GraphML file
citation_graph = nx.read_graphml(citation_path)
# Load the collaboration graph from GraphML file
collaboration_graph = nx.read_graphml(collaboration_path)
# Load the subgraph collaboration graph from GraphML file
subgraph_collaboration_graph = nx.read_graphml(subcollaboration_path)
2. Controlling system¶
In this section, five different functionalities to analyze the produced graphs are implemented from scratch and their outputs are visualized. You can check the full code inside the files backend.py (implementation) and frontend.py (visualization).
Please note that the visualizations are interactive, letting the user dynamically select the functionalities' arguments. Unfortunately, only the static outputs are displayed if you're reviewing this notebook at the link https://ambarchatterjee.github.io/ADM_HW5_Group21. The widgets are truly interactive only when the notebook is run locally.
Functionality 1 - Graph's features¶
This first functionality examines a graph and reports some of its features. Leveraging the networkX library, it takes as input the graph and, optionally, an integer k, and returns the following items:
- A table containing the following general information about the graph:
- Number of nodes in the graph
- Number of edges in the graph
- Density of the graph
- Average degree of the graph
- Whether the network is sparse or dense
- A table that lists the graph's hubs
- A plot depicting the distribution of the citations received by papers (Citation graph)
- A plot depicting the distribution of the citations given by papers (Citation graph)
- A plot depicting the number of collaborations of the top k authors by degree (Collaboration graph)
To have a better understanding of the data, it was executed on both the Citation and Collaboration Graphs.
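For reference, below is a minimal sketch of how such summary features can be computed with networkx (the sparse/dense threshold and the 95th-percentile hub criterion are illustrative assumptions, not necessarily the choices made in backend.py):
def graph_features_sketch(G, k=20):
    # Basic size measures
    n_nodes = G.number_of_nodes()
    n_edges = G.number_of_edges()
    density = nx.density(G)
    # Average degree over all nodes
    avg_degree = sum(d for _, d in G.degree()) / n_nodes
    # Illustrative sparseness criterion: density much smaller than 1
    kind = 'sparse' if density < 0.1 else 'dense'
    # Hubs: nodes whose degree exceeds the 95th percentile of the degree distribution
    degrees = [d for _, d in G.degree()]
    threshold = np.percentile(degrees, 95)
    hubs = [v for v, d in G.degree() if d > threshold]
    # Top k nodes by degree (used for the collaboration plot)
    top_k = sorted(G.degree(), key=lambda x: x[1], reverse=True)[:k]
    return n_nodes, n_edges, density, avg_degree, kind, hubs, top_k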
# CITATION GRAPH
first_funct = widgets.interactive(visual_1,
{'manual': True},
G = widgets.Dropdown(options=[('Citation Graph',citation_graph),('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:'),
k = widgets.IntSlider(min = 2, max = 50, step = 1, value = 20, description = 'Top Authors:'))
first_funct.children[-1].layout.height = '1450px'
display(first_funct)
# COLLABORATION GRAPH
first_funct = widgets.interactive(visual_1,
{'manual': True},
G = widgets.Dropdown(options=[('Citation Graph',citation_graph),('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:'),
k = widgets.IntSlider(min = 2, max = 50, step = 1, value = 20, description = 'Top Authors:'))
first_funct.children[-1].layout.height = '1450px'
display(first_funct)
From the tables we deduce that both graphs are very sparse, with a density close to zero.
The average degree reflects this: looking at the hubs, we can see that most nodes have a low degree (the 95th percentile is 30 for the Citation Graph and 24 for the Collaboration Graph, which are very low values considering that each graph has at least 10,000 nodes).
The distributions of given and received citations (Citation Graph) are almost identical, with a frequency peak in the first class: this is another confirmation of the sparseness noted above.
The author who collaborated the most is: Rodrigo Lopez
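This can be checked directly on the graph with a short sketch (the backend may rank by weighted degree instead of plain degree):
top_author_id, top_degree = max(collaboration_graph.degree(), key=lambda x: x[1])
print(collaboration_graph.nodes[top_author_id].get('author_name'), top_degree)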
Functionality 2 - Nodes' contribution¶
This functionality uses the methods embedded in the networkX library to compute the following centrality measures for a chosen node:
- Betweenness Centrality: measures the number of times a node lies on the shortest paths between other nodes.
- PageRank: a variant of eigenvector centrality that takes link direction into account; eigenvector centrality takes into account the degree of the nodes connected to the original node, and so on.
- Closeness Centrality: the reciprocal of the sum of the lengths of the shortest paths between the node and every other node.
- Degree Centrality: the normalized degree of the node (its degree divided by the maximum possible degree).
The results are displayed in a table. Please note that, since a node id must be specified to calculate the centrality measures, a node id finder was added: it lets the user find a node id by typing either the author's name or the paper's title.
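A minimal sketch of how these measures can be obtained for a single node v (functionalities 1 and 2 may rely on networkX, so library calls are used here):
def node_contribution_sketch(G, v):
    # betweenness, pagerank and degree_centrality return dicts keyed by node;
    # closeness_centrality can be asked directly for the single node v
    return {
        'betweenness': nx.betweenness_centrality(G)[v],
        'pagerank': nx.pagerank(G)[v],
        'closeness': nx.closeness_centrality(G, u=v),
        'degree': nx.degree_centrality(G)[v],
    }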
finder = widgets.interactive(visual_id_finder,
{'manual': True},
G = widgets.Dropdown(options=[('Citation Graph',citation_graph),('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:'),
input_str = widgets.Text(value='',placeholder='Type name or title',description='Name/Title:'))
finder.children[-1].layout.height = '200px'
display(finder)
second_funct = widgets.interactive(visual_2,
{'manual': True},
G = widgets.Dropdown(options=[('Citation Graph',citation_graph),('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:'),
v = widgets.Text(value='',placeholder='Type node ID',description='Node ID:'))
second_funct.children[-1].layout.height = '200px'
display(second_funct)
The paper Probabilistic Reasoning in Intelligent Systems: Networks of Plausible Inference was used to calculate the centrality measures.
Even though it is a hub node of the Citation Graph, its centrality values are close to zero: this, once again, reflects how sparse the graph is.
Functionality 3 - Shortest ordered walk¶
This functionality implements a BFS algorithm to find the shortest walk between two nodes $A_1$ and $A_n$ that crosses, in order, an arbitrary list of nodes $A = [A_2,...,A_{n-1}]$. It was implemented only for the Collaboration Graph and it displays:
- A table listing, in order, the papers that need to be crossed in the shortest walk.
- A zoomed plot of the graph in which nodes and edges that appear in the shortest path are highlighted.
Note that, to make the visualizations and the calculations easier, it's possible to select a sub-graph consisting of the top N authors by degree.
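A minimal from-scratch sketch of the underlying idea (assumption: the graph is given as a plain adjacency-list dict, e.g. built with {v: list(G.neighbors(v)) for v in G}; the actual implementation lives in backend.py):
from collections import deque

def bfs_shortest_path(adj, start, goal):
    # Standard BFS on an adjacency-list dict; returns the node sequence or None
    parent = {start: None}
    queue = deque([start])
    while queue:
        node = queue.popleft()
        if node == goal:
            path = []
            while node is not None:
                path.append(node)
                node = parent[node]
            return path[::-1]
        for nbr in adj.get(node, []):
            if nbr not in parent:
                parent[nbr] = node
                queue.append(nbr)
    return None

def shortest_ordered_walk(adj, waypoints):
    # Concatenate BFS shortest paths between consecutive waypoints A_1, A_2, ..., A_n
    walk = [waypoints[0]]
    for a, b in zip(waypoints, waypoints[1:]):
        segment = bfs_shortest_path(adj, a, b)
        if segment is None:
            return None  # there is no walk crossing the nodes in the requested order
        walk += segment[1:]
    return walk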
N_slider = widgets.IntSlider(min = 2, max = 5000, step = 1, value = 500, description = 'Top Authors by degree to consider:', layout = widgets.Layout(width='75%'))
drop = widgets.Dropdown(options=[('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:')
def on_choose_N(d):
if drop.value == collaboration_graph:
N_slider.max = len(list(collaboration_graph.nodes()))
else:
N_slider.max = len(list(subgraph_collaboration_graph.nodes()))
return N_slider.max
widgets.dlink((drop, "value"), (N_slider, "max"), on_choose_N)
third_funct = widgets.interactive(visual_3,
{'manual': True},
G = drop,
a1 = widgets.Text(value='',placeholder='Type starting node ID',description='Starting Node ID:'),
a = widgets.Textarea(value = '', placeholder = 'Type the nodes IDs separated by a blank space', description = 'List of nodes to walk through:'),
an = widgets.Text(value='',placeholder='Type ending node ID',description='Ending Node ID:'),
N = N_slider)
third_funct.children[-1].layout.height = '900px'
display(third_funct)
Functionality 4 - Disconnecting Graphs¶
This functionality, developed for the Collaboration Graph only, finds the minimum number of edges (taking their weights into account) whose removal splits the original graph into two disconnected subgraphs.
This problem is well known in the literature as the minimum cut problem (weighted version). As stated by the max-flow min-cut theorem, the weight of this cut equals the maximum amount of flow that can be sent from the source to the sink in the given network. The minimum_cut() function embedded in networkX leverages this theorem to provide a solution. We used minimum_cut() treating authorA as the source of the graph and authorB as its sink, and added edge capacities equal to the inverse of the edge weights, so that minimizing the weight of the cut is equivalent to maximizing the flow.
We've tried several times to implement the algorithm from scratch without any success.
The output of this functionality consists of the following items:
- The number of the links that should be cut (with the overall weight)
- The original graph
- The graph after removing the links (the two specified nodes are highlighted)
Note that, to make the visualizations and the calculations easier, it's possible to select a sub-graph consisting of the top N authors by degree.
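A minimal sketch of the networkX call described above (names are illustrative; the real code in backend.py also restricts the graph to the top N authors and produces the plots):
def min_cut_sketch(G, authorA, authorB):
    # Edge capacity = inverse of the collaboration weight, as described above
    H = G.copy()
    for u, v, data in H.edges(data=True):
        data['capacity'] = 1.0 / data['weight']
    cut_value, (side_a, side_b) = nx.minimum_cut(H, authorA, authorB, capacity='capacity')
    # The links to remove are those with one endpoint on each side of the cut
    cut_edges = [(u, v) for u, v in H.edges() if (u in side_a) != (v in side_a)]
    return cut_value, cut_edges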
N_slider = widgets.IntSlider(min = 2, max = 5000, step = 1, value = 500, description = 'Top Authors by degree to consider:', layout = widgets.Layout(width='75%'))
drop = widgets.Dropdown(options=[('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:')
def on_choose_N(d):
if drop.value == collaboration_graph:
N_slider.max = len(list(collaboration_graph.nodes()))
else:
N_slider.max = len(list(subgraph_collaboration_graph.nodes()))
return N_slider.max
widgets.dlink((drop, "value"), (N_slider, "max"), on_choose_N)
fourth_funct = widgets.interactive(visual_4,
{'manual': True},
G = drop,
authorA = widgets.Text(value='',placeholder='Type first node ID',description='First Node ID:'),
authorB = widgets.Text(value = '', placeholder = 'Type second node ID', description = 'Second Node ID:'),
N = N_slider)
fourth_funct.children[-1].layout.height = '1000px'
display(fourth_funct)
Functionality 5 - Extracting Communities¶
This functionality takes two node ids as input and returns the community structure of the graph, leveraging the Girvan-Newman algorithm. For the Citation Graph, the notion of weakly connected components was used to detect connected components. The output consists of the following items:
- The number of links that should be removed to have the communities
- A table depicting the communities and the nodes that belong to each community
- The original graph
- The graph showing the communities in the network, with a legend displaying the community of the specified nodes
Note that, to make the visualizations and the calculations easier, it's possible to select a sub-graph consisting of the top N authors by degree.
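A compact sketch of the Girvan-Newman loop (illustrative only: edge betweenness is taken from networkx here, whereas the from-scratch backend computes it itself; for the directed Citation Graph the components are the weakly connected ones):
def girvan_newman_sketch(G, target_n_communities=2):
    H = G.copy()
    components = (nx.weakly_connected_components if H.is_directed()
                  else nx.connected_components)
    removed = 0
    communities = list(components(H))
    while len(communities) < target_n_communities and H.number_of_edges() > 0:
        # Remove the edge with the highest betweenness, then recompute the components
        betweenness = nx.edge_betweenness_centrality(H)
        edge = max(betweenness, key=betweenness.get)
        H.remove_edge(*edge)
        removed += 1
        communities = list(components(H))
    return removed, communities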
N_slider = widgets.IntSlider(min = 2, max = 5000, step = 1, value = 500, description = 'Top Authors by degree to consider:', layout = widgets.Layout(width='75%'))
drop = widgets.Dropdown(options=[('Citation Graph',citation_graph),('Collaboration Graph',collaboration_graph),('Collaboration Graph (Largest Component)',subgraph_collaboration_graph)], description='Graph:')
def on_choose_N(d):
if drop.value == collaboration_graph:
N_slider.max = len(list(collaboration_graph.nodes()))
elif drop.value == subgraph_collaboration_graph:
N_slider.max = len(list(subgraph_collaboration_graph.nodes()))
else:
N_slider.max = len(list(citation_graph.nodes()))
return N_slider.max
widgets.dlink((drop, "value"), (N_slider, "max"), on_choose_N)
fifth_funct = widgets.interactive(visual_5,
{'manual': True},
G = drop,
paper_1 = widgets.Text(value='',placeholder='Type first node ID',description='First Node ID:'),
paper_2 = widgets.Text(value='',placeholder='Type second node ID',description='Second Node ID:'),
N = N_slider)
fifth_funct.children[-1].layout.height = '1700px'
display(fifth_funct)
It is easily shown that, among the top 90 authors by degree, there is one big dominant community including most of them. The other communities contain far fewer nodes than the dominant one.
There are also a few connected components (detached from the main one) that form micro-communities.
4. Command Line Question (CLQ)¶
# # Question 1
# echo "Is there any node that acts as an important "'connector'" between the different parts of the graph?"
# grep -o 'target="[0-9]*"' citation_graph.graphml | cut -d'"' -f2 | sort | uniq -c | sort -nr | head -n 1
# # Question 2
# echo "How does the degree of citation vary among the graph nodes?"
# max=$(grep -o 'target="[0-9]*"' citation_graph.graphml | cut -d'"' -f2 | sort | uniq -c | sort -nr | awk '{print $1}' | head -n 1)
# min=$(grep -o 'target="[0-9]*"' citation_graph.graphml | cut -d'"' -f2 | sort | uniq -c | sort -nr | awk '{print $1}' | tail -n 1)
# echo "Ranges from $max to $min"
# # Question 3
# echo "What is the average length of the shortest path among nodes?"
# # pip install networkx
# python -c'
# import networkx as nx
# # Load the graph from a GraphML file
# G = nx.read_graphml("citation_graph.graphml")
# sum = 0
# # Check if the graph is strongly connected
# if nx.is_strongly_connected(G):
# average_distance = nx.average_shortest_path_length(G)
# print(f"Average shortest path length: {average_distance}")
# else:
# print("Graph is not strongly connected.")
# # Calculate average shortest path length for each connected component
# components = list(nx.strongly_connected_components(G))
# for i, component in enumerate(components, start=1):
# subgraph = G.subgraph(component)
# component_average_distance = nx.average_shortest_path_length(subgraph)
# sum = sum + component_average_distance
# print(f"Average shortest path length: {sum/i}")
# '
Explanation of what is done in each part
- Question 1:
  - Looks for every occurrence of a cited node in the GraphML file (edges are identified by their `target` attribute).
  - Extracts the node IDs from the matches with `cut`.
  - Uses `uniq -c` to count how many times each node ID appears.
  - Sorts the counts from largest to smallest with `sort -nr`.
  - Displays the first line, i.e. the largest count, with `head -n 1`.
  - This returns the node that can be seen as a possible connector between the different parts of the graph.
- Question 2:
  - Like Question 1, it counts how often each node appears as a citation target in the graph.
  - Uses `awk` to keep just the counts, then locates the highest and lowest values.
  - Echoes the result as "Ranges from X to Y", giving an idea of how much the number of received citations varies across nodes.
- Question 3:
  - Uses NetworkX to check whether the citation graph is strongly connected.
  - If it is, it computes and prints the average shortest path length for the whole graph.
  - If it is not, it computes the average shortest path length for each strongly connected component, treating the components separately.
  - Finally, it prints the mean of these per-component averages as the overall figure.
5. Algorithmic Questions (AQ)¶
def skillScore():
# Line 1 input: (N, M and S)
N, M, S = input("Enter N, M and S values space separated: ").split(" ")
N, M, S = int(N), int(M), int(S)
# Line 2 input: Set of skills (S)
skillsReq = input("Enter skills space separated: ").split(" ")
# Line 3 input: Player id, Skill and Skill score
skillsAndSkillScore = {}
# skillsAndSkillScore = []
for i in range(N):
playerId = int(input())
for ii in range(S):
playerSkill, skillScore = input().split()
if playerSkill in skillsAndSkillScore:
skillsAndSkillScore[playerSkill].append(int(skillScore))
else:
skillsAndSkillScore[playerSkill] = [int(skillScore)]
teamScore = 0
# Sort Scores
for key, _ in skillsAndSkillScore.items():
skillsAndSkillScore[key] = sorted(skillsAndSkillScore[key], reverse=True)
print("Sorted scores are: ", skillsAndSkillScore)
for skill in skillsReq:
if skill in skillsAndSkillScore:
if len(skillsAndSkillScore[skill]) <= 0:
teamScore += 0
else:
score = skillsAndSkillScore[skill].pop(0)
teamScore += score
else:
teamScore += 0
print("Skills and skill score is: ", skillsAndSkillScore)
print("Team score is: ", teamScore)
return teamScore
#Inserting input 1
out1 = skillScore()
out1
Sorted scores are: {'BSK': [98], 'ATH': [52, 14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [59, 34, 16], 'VOL': [32], 'SOC': [41]} Skills and skill score is: {'BSK': [98], 'ATH': [52, 14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [32], 'SOC': [41]} Team score is: 59 Skills and skill score is: {'BSK': [98], 'ATH': [52, 14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 91 Skills and skill score is: {'BSK': [98], 'ATH': [14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 143 Skills and skill score is: {'BSK': [98], 'ATH': [14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 143 Skills and skill score is: {'BSK': [98], 'ATH': [14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 143 Skills and skill score is: {'BSK': [], 'ATH': [14], 'HCK': [95, 82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 241 Skills and skill score is: {'BSK': [], 'ATH': [14], 'HCK': [82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 336 Skills and skill score is: {'BSK': [], 'ATH': [14], 'HCK': [82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [34, 16], 'VOL': [], 'SOC': [41]} Team score is: 336 Skills and skill score is: {'BSK': [], 'ATH': [14], 'HCK': [82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [16], 'VOL': [], 'SOC': [41]} Team score is: 370 Skills and skill score is: {'BSK': [], 'ATH': [14], 'HCK': [82, 9], 'FTB': [90], 'TEN': [85], 'RGB': [46], 'SWM': [16], 'VOL': [], 'SOC': [41]} Team score is: 370
370
#Inserting input 2
out2 = skillScore()
out2
Sorted scores are: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [52, 30, 14], 'VOL': [32, 20, 1], 'SWM': [59, 34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Skills and skill score is: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [52, 30, 14], 'VOL': [32, 20, 1], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 59 Skills and skill score is: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [52, 30, 14], 'VOL': [20, 1], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 91 Skills and skill score is: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [20, 1], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 143 Skills and skill score is: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [1], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 163 Skills and skill score is: {'BSK': [98, 12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 164 Skills and skill score is: {'BSK': [12], 'HCK': [95, 82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 262 Skills and skill score is: {'BSK': [12], 'HCK': [82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 357 Skills and skill score is: {'BSK': [], 'HCK': [82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [34, 30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 369 Skills and skill score is: {'BSK': [], 'HCK': [82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 403 Skills and skill score is: {'BSK': [], 'HCK': [82, 50, 40, 12, 9], 'ATH': [30, 14], 'VOL': [], 'SWM': [30, 27, 16, 11], 'FTB': [90, 12], 'RGB': [80, 46, 7], 'TEN': [85, 82], 'SOC': [41]} Team score is: 403
403
- Input Collection:
  - Reads three space-separated values: N is the number of players, M the number of skills, and S the number of skill-score pairs listed for each player.
  - Reads the list of skills required by the team, separated by spaces.
- Player Skill and Score Storage:
  - Initializes a dictionary (`skillsAndSkillScore`) to store, for each skill, the scores of the players that have it.
  - Iterates over every player, reading the player ID together with the player's skill-score pairs.
  - Each pair is stored in the dictionary.
- Sorting Scores:
  - Sorts the scores of each skill from best to worst.
- Team Score Calculation:
  - Initializes a variable (`teamScore`) to zero.
  - Iterates over the skills required by the team. For each skill:
    - Checks whether the skill is present in the dictionary.
    - If present, checks whether the skill still has an available score.
    - If it does, the highest remaining score is taken, added to the team total, and removed from the list of scores.
    - If the skill has no remaining scores, it contributes 0 points.
    - If the team requires a skill that no player has, it likewise contributes 0 points.
  - Prints the updated `skillsAndSkillScore` dictionary and the current team score after each skill.
- Final Output:
  - Prints the final team score.
2. What is the time complexity (the Big O notation) of your solution? Please provide a detailed explanation of how you calculated the time complexity.¶
The time complexity is O(N * S * log(S)), where N is the number of players and S is the number of skills per player. Reading the input takes O(N * S), the result of nested loops that iterate over the players and their skills. The sorting step performed for every skill adds a factor of log(S), giving an overall time complexity of O(N * S * log(S)). Considering the worst case, this notation describes how the execution time grows as the input size grows: because the sorting step is log-linear, it is the dominating factor in the overall time complexity.
3. Ask ChatGPT or any other LLM chatbot tool to check your code's time complexity (the Big O notation). Compare your answer to theirs. If the two differ, which one is right? (why?)¶
Analyzing the code step by step, the overall time complexity of the `skillScore` function can be determined as follows:
Time Complexity of `skillScore()`:
Input Processing:
- Reading N, M, and S: O(1)
- Reading skillsReq: O(S)
- Reading player data: O(N * S)
Constructing the `skillsAndSkillScore` dictionary:
- Inserting an element into a dictionary: O(1) per insertion
- Insertions are performed for N * S elements
- Total time complexity: O(N * S)
Sorting the `skillsAndSkillScore` dictionary:
- Sorting the dictionary's values: O(N * S * log(S))
Calculating teamScore:
- For each skill in skillsReq:
  - Checking if the skill exists: O(1)
  - Checking if the skill's score list exists: O(1)
  - Checking if the skill's score list is non-empty: O(1)
  - Adding the skill score to teamScore: O(1)
- Iterating over skillsReq: O(S)
- Total time complexity for the team score calculation: O(S)
Overall Time Complexity:
Summarizing the individual time complexities:
- Input processing: O(1) + O(S) + O(N * S) = O(N * S)
- `skillsAndSkillScore` construction: O(N * S)
- `skillsAndSkillScore` sorting: O(N * S * log(S))
- teamScore calculation: O(S)
Therefore, the overall time complexity of the `skillScore` function is O(N * S * log(S)). This means that the function's execution time grows linearly with the number of players (N) and the number of skills per player (S), and also grows logarithmically with the number of skills (S) because of the sorting step.
4. If your algorithm has exponential time complexity, can you provide a polynomial-time version?¶
It has polynomial time complexity
5. If S = 1 how does the time complexity of an optimal algorithm to solve this problem change?¶
If S is fixed to 1, the time complexity of an optimal algorithm is O(N), where N is the number of players. Since there is only one skill in this case, no sorting is needed at all: it suffices to scan the players once and keep the highest score for that single skill, which is a linear-time operation.
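A minimal sketch of the S = 1 case (a hypothetical helper, not part of the submitted code):
def best_single_skill_score(scores):
    # With a single required skill, the team score is just the best score among all players
    best = 0
    for s in scores:  # one linear scan: O(N)
        if s > best:
            best = s
    return best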
Part B¶
1. Prove or disprove that the problem is NP-complete.¶
To decide whether the problem is NP-complete, it must satisfy both the NP and the NP-hardness requirements.
For NP:
A problem belongs to the complexity class NP if a candidate solution can be verified in polynomial time. One way to verify a solution for this problem is to check that the team covers all of the necessary skills and that the overall collaboration effort is kept to the claimed minimum. This can be done with a depth-first search on the graph G in polynomial time. As a result, the problem is in NP.
For NP-hard:
A problem is NP-hard if every problem in the complexity class NP can be reduced to it in polynomial time. To show that our problem is NP-hard, we have to present a polynomial-time reduction from another NP-hard problem to it.
A suitable problem to consider is Set Cover, a well-known NP-complete problem, which states:
Given a set of items S and a collection C of subsets of S, determine the smallest subcollection of C that covers S.
We can reduce Set Cover to our problem by constructing a graph G in the following way:
Every element of S is matched with a node in G, and every subset in C corresponds to a clique in G. The weight of an edge connecting two nodes is the effort needed for the matching team members to collaborate effectively. Then, by determining the minimum spanning tree of G, we can determine the smallest subcollection of C that covers S.
As a result, Set Cover can be reduced to our problem in polynomial time. This implies that any algorithm able to solve our problem in polynomial time could also be used to solve Set Cover in polynomial time. It follows that, since Set Cover is NP-hard, our problem is NP-hard as well.
2. Write a heuristic in order to approximate the best solution for this problem.¶
Randomised Greedy Heuristic: this heuristic is similar to the plain greedy heuristic, but it adds randomness to the selection process. Rather than always choosing the player with the greatest skill score for each required skill, it chooses a player at random from the pool of eligible players. This may lessen the chance of becoming trapped in local optima.
The procedure is the following (sketched below): begin with an empty team; add a player with the greatest skill score for a required skill who isn't on the team yet (greedy step); repeat this step until the team covers all of the required skills.
Pros: less likely to get stuck in local optima. Cons: may not find the optimal solution.
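A minimal sketch of the randomised greedy idea (assumptions: players maps each player id to a dict of skill scores, and picking at random among the top_k candidates is one possible way to add randomness):
import random

def randomized_greedy_team(players, required_skills, top_k=3):
    # players: {player_id: {skill: score, ...}}; required_skills: iterable of skill names
    team = set()
    for skill in required_skills:
        # Eligible players: those who have the skill and are not on the team yet
        eligible = [(p, skills[skill]) for p, skills in players.items()
                    if skill in skills and p not in team]
        if not eligible:
            continue  # no available player covers this skill
        # Greedy with randomness: pick at random among the top_k highest scores
        eligible.sort(key=lambda x: x[1], reverse=True)
        chosen, _ = random.choice(eligible[:top_k])
        team.add(chosen)
    return team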
3. What is the time complexity of your solution?¶
The heuristic's time complexity is O(N * S * log(S)): for each required skill (S), the heuristic has to look at the players (N) and find the one with the highest skill score for that skill, and this selection can be supported by a priority queue whose operations cost O(log(S)).