File size: 1,146 Bytes
c1e3e0a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import pandas as pd
import streamlit as st
import datetime as dt
from datetime import datetime

# Load the repository metadata; the CSV uses ';' as its field separator.
repo_data = pd.read_csv('repo_data2.csv', sep=';')

# Swap the raw CSV column names for human-readable labels.
repo_data = repo_data.rename(columns={
    'name': 'Name',
    'license': 'License',
    'full_name': 'Full Name',
    'description': 'Github Description',
    'categories': 'Category',
    'topics': 'Github Topics',
    'platforms': 'Platforms',
    'main_prog_language': 'Main Programming Language',
    'programming_languages': 'Programming Languages used',
    'technologies': 'Techniques used',
    'natural_languages': 'Languages Available',
})

# Replace every missing cell with the literal string 'None'.
# pd.isna() already reports True for None as well as NaN/NaT, so a separate
# `== None` comparison is unnecessary.
repo_data = repo_data.map(lambda cell: 'None' if pd.isna(cell) else cell)

def parse_to_list(x):
    """Split a ``'//'``-delimited string into a list of its parts.

    Any value that is not a ``str`` is returned unchanged.
    """
    if not isinstance(x, str):
        return x
    return x.split('//')

def extract_unique(series):
    """Return the distinct items found across all list entries of *series*.

    Entries of *series* that are not lists are skipped. The remaining lists
    are flattened into one sequence, and the result is whatever
    ``pd.Series(...).unique()`` returns for it (unique values in order of
    first appearance).
    """
    flattened = []
    for entry in series:
        if isinstance(entry, list):
            flattened.extend(entry)
    return pd.Series(flattened).unique()
def filter(options):
    """Build a predicate that checks a list contains every item in *options*.

    The returned callable takes one value (``series``) and returns ``True``
    only when that value is a ``list`` containing all of *options*; any
    non-list value yields ``False``.

    NOTE(review): this name shadows the built-in ``filter`` within the
    module; it is kept so existing callers keep working.
    """
    def matches(series):
        if not isinstance(series, list):
            return False
        for wanted in options:
            if wanted not in series:
                return False
        return True

    return matches

def parse_date(string):
    """Reformat the leading ``YYYY-MM-DD`` of *string* as ``'<Month> DD, YYYY'``.

    Only the first ten characters are parsed, so anything after the date
    (such as a time component) is ignored. ``datetime.strptime`` raises
    ``ValueError`` when that prefix does not match ``%Y-%m-%d``.
    """
    day_part = string[:10]
    parsed = datetime.strptime(day_part, '%Y-%m-%d')
    # %B is the full month name as rendered by strftime.
    return parsed.date().strftime('%B %d, %Y')