first commit

This commit is contained in:
rnsrk 2024-11-12 03:37:02 +01:00
commit daa1115964
10 changed files with 284 additions and 0 deletions

2
.gitignore vendored Normal file
View file

@ -0,0 +1,2 @@
.venv
data

120
app.py Normal file
View file

@ -0,0 +1,120 @@
from flask import Flask, render_template, redirect, url_for
import pandas as pd
from charts.charts import bar_chart, bar_chart_with_special_legend, point_chart, pie_chart
app = Flask(__name__)
# Read the CSV file
def translate_csv(file, translation_dict):
with open(file, 'r') as f:
text = f.read()
for key, value in translation_dict.items():
text = text.replace(key, value)
with open('data/umfrage2survey.csv', 'w') as f:
f.write(text)
translation_dict = {
'Wie sind Sie auf WissKI aufmerksam geworden?': 'How did you hear about WissKI?',
'In welchem Bereich verwenden Sie WissKI?': 'In which area do you use WissKI?',
'Wie lange arbeiten Sie mit WissKI?': 'How long do you work with WissKI?',
'Bedeutung von Softwarefeatures und Eigenschaften': 'Importance of software features and properties',
'In welcher Rolle benutzen Sie WissKI?': 'In which role do you use WissKI?',
'Haben Sie Erfahrung mit anderen Forschungsdaten-Management-Systemen?': 'Do you have experience with other research data management systems?',
'Haben Sie Zugriff auf kompetenten IT- und Systemadministrationssupport innerhalb Ihres Projektes bzw. Institution?': 'Do you have access to competent IT and system administration support within your project or institution?',
'Arbeitet Ihre Institution/ Unternehmen das erste Mal mit WissKI?': 'Is this the first time your institution/company has worked with WissKI?',
'Wie viele Stunden stehen Ihnen für die Arbeit mit WissKI wöchentlich zur Verfügung?': 'How many hours a week do you have available for working with WissKI?',
'Welchen Community-Angeboten haben Sie mindestens einmal wahrgenommen?': 'Which community offers have you used at least once?',
'Im Verhältnis zu anderen Forschungsdaten-Management-Systemen verorte ich die Qualität von WissKI als...': 'In relation to other research data management systems, I classify the quality of WissKI as...',
'Wie wahrscheinlich ist es, dass Sie WissKI als Forschungsdaten-Management-System weiterempfehlen?':'How likely is it that you would recommend WissKI as a research data management system?'
}
translate_csv('data/Community-Umfrage.csv', translation_dict)
df = pd.read_csv('data/umfrage2survey.csv', encoding='utf8')
#df = pd.read_csv('data/Community-Umfrage.csv', encoding='utf8')
plots = {}
# Normal bar charts
# 1 Wie sind Sie auf WissKI aufmerksam geworden?
# 2 In welchem Bereich verwenden Sie WissKI?
# 25 Haben Sie Zugriff auf kompetenten IT- und Systemadministrationssupport innerhalb Ihres Projektes bzw. Institution?
# 26 Arbeitet Ihre Institution/ Unternehmen das erste Mal mit WissKI?
bar_charts = [1,2,25,26]
for chart in bar_charts:
question_data = df.iloc[:, chart]
question_plot = bar_chart(question_data, question_data.name)
plots[chart] = (question_data.name, question_plot)
# Cleaned pie charts
# 23 In welcher Rolle benutzen Sie WissKI?
question_data = df.iloc[:, 23]
for index, value in question_data.items():
new_value = value.split(' (')[0]
question_data[index] = new_value
question_plot = pie_chart(question_data, question_data.name)
plots[3] = (question_data.name, question_plot)
# Normal Pie charts
# 3 Wie lange arbeiten Sie mit WissKI?
# 24 Haben Sie Erfahrung mit anderen Forschungsdaten-Management-Systemen?
# 27 Wie viele Stunden stehen Ihnen für die Arbeit mit WissKI wöchentlich zur Verfügung?
# 28 Welchen Community-Angeboten haben Sie mindestens einmal wahrgenommen?
pie_charts = [3,24,27,28]
for chart in pie_charts:
question_data = df.iloc[:, chart]
question_plot = pie_chart(question_data, question_data.name)
plots[chart] = (question_data.name, question_plot)
# Point charts
# 9-22 Software Features
median_values = df.iloc[:, 9:23].median()
median_values_cleaned = pd.Series(name='Software Features')
for index, value in median_values.items():
new_index = index.split(' [')[1].split(']')[0]
median_values_cleaned[new_index] = value
point_plot = point_chart(median_values_cleaned, 'Software Features')
plots[9] = ('Software Features', point_plot)
# Bar charts with median
# 29 Im Verhältnis zu anderen Forschungsdaten-Management-Systemen verorte ich die Qualität von WissKI als...
bar_charts_with_median = [29]
for chart in bar_charts_with_median:
question_data = df.iloc[:, chart]
question_plot = bar_chart_with_special_legend(question_data, question_data.name, 'quality')
plots[chart] = (question_data.name, question_plot)
bar_charts_with_median = [31]
for chart in bar_charts_with_median:
question_data = df.iloc[:, chart]
question_plot = bar_chart_with_special_legend(question_data, question_data.name, 'recommendation')
plots[chart] = (question_data.name, question_plot)
plots = dict(sorted(plots.items(), key=lambda x: x[0]))
# Generate list of charts
charts = [{'id': i+1, 'title': plots[col][0], 'data': plots[col][1]} for i, col in enumerate(plots.keys())]
@app.route('/')
def index():
return redirect(url_for('show_chart', chart_id=1))
@app.route('/chart/<int:chart_id>')
def show_chart(chart_id):
chart = next((c for c in charts if c['id'] == chart_id), None)
if not chart:
return redirect(url_for('index'))
plot_url = chart['data']
prev_id = chart_id - 1 if chart_id > 1 else len(charts)
next_id = chart_id + 1 if chart_id < len(charts) else 1
return render_template('chart.html', plot_url=plot_url, prev_id=prev_id, next_id=next_id, title=chart['title'])
if __name__ == '__main__':
app.run(debug=True)

1
charts/__init__.py Normal file
View file

@ -0,0 +1 @@
# This file can be empty but is required to make the charts directory a package

Binary file not shown.

Binary file not shown.

Binary file not shown.

104
charts/charts.py Normal file
View file

@ -0,0 +1,104 @@
import seaborn as sns
import matplotlib.pyplot as plt
import io
import base64
import pandas as pd
def bar_chart(data, title):
data = data.str.split(';').explode().value_counts()
fig, ax = plt.subplots(figsize=(12,6))
palette = sns.color_palette("husl", len(data))
sns.barplot(x=data.index, y=data.values, ax=ax, hue=data.index, palette=palette, legend=False)
ax.set_xlabel('Answer')
ax.set_ylabel('Count')
# Rotate the x-axis labels and set their horizontal alignment
for tick in ax.get_xticklabels():
tick.set_rotation(45)
tick.set_horizontalalignment('right')
tick.set_fontsize(12)
fig.tight_layout()
img = io.BytesIO()
fig.savefig(img, format='png', dpi=300, bbox_inches='tight', pad_inches=0.5)
img.seek(0)
plot_url = base64.b64encode(img.getvalue()).decode('utf8')
plt.close()
return plot_url
def bar_chart_with_special_legend(data, title, scale='recommendation'):
if scale == 'recommendation':
data = data.map({1:'not likely', 2:'less likely', 3:'not sure', 4:'more likely', 5:'definitely'})
# create a value counts series
data_counts = data.value_counts()
fig, ax = plt.subplots(figsize=(12,6))
palette = sns.color_palette("husl", 5)
sns.barplot(x=data_counts.index, y=data_counts.values, ax=ax, hue=data_counts.index, palette=palette)
ax.set_xlabel('Answer')
ax.set_ylabel('Count')
# set y-axis to only have integer values
ax.yaxis.set_major_locator(plt.MultipleLocator(1.0))
# Rotate the x-axis labels and set their horizontal alignment
for tick in ax.get_xticklabels():
tick.set_rotation(45)
tick.set_horizontalalignment('right')
tick.set_fontsize(12)
fig.tight_layout()
img = io.BytesIO()
fig.savefig(img, format='png', dpi=300, bbox_inches='tight', pad_inches=0.5)
img.seek(0)
plot_url = base64.b64encode(img.getvalue()).decode('utf8')
plt.close()
return plot_url
def pie_chart(data, title):
data = data.str.split(';').explode().value_counts()
fig, ax = plt.subplots(figsize=(12,6))
ax.pie(data.values, labels=data.index, autopct='%1.1f%%')
fig.tight_layout()
img = io.BytesIO()
fig.savefig(img, format='png', dpi=300, bbox_inches='tight', pad_inches=0.5)
img.seek(0)
plot_url = base64.b64encode(img.getvalue()).decode('utf8')
plt.close()
return plot_url
def point_chart(data, title):
# Count the occurrences of each value
# Map the x-axis values to the appropriate string
data = data.map({1:'not important', 2:'less important', 3:'important', 4:'more important', 5:'mandatory'})
# Create a figure and axis
fig, ax = plt.subplots()
# Plot your data
for answer, value in data.items():
ax.plot([value], [answer], marker='o')
# Set the x-axis ticks and labels
ax.set_xticks(list(set(data.values)))
ax.set_xticklabels(list(set(data.values)), rotation=45)
# Set the y-axis limits to remove the axis
ax.set_yticks(list(data.keys()))
# Set the font size of the y-axis
for tick in ax.get_yticklabels():
tick.set_fontsize(9)
fig.tight_layout()
img = io.BytesIO()
fig.savefig(img, format='png', dpi=300, bbox_inches='tight', pad_inches=0.5)
img.seek(0)
plot_url = base64.b64encode(img.getvalue()).decode('utf8')
plt.close()
return plot_url

23
static/styles.css Normal file
View file

@ -0,0 +1,23 @@
body {
font-family: Arial, sans-serif;
text-align: center;
}
img {
width: 80%;
height: auto;
}
div {
margin-top: 20px;
}
a {
text-decoration: none;
font-size: 20px;
}
.navigation {
display: flex;
justify-content: space-around;
}

34
templates/chart.html Normal file
View file

@ -0,0 +1,34 @@
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<title>{{ title }}</title>
<link rel="stylesheet" href="{{ url_for('static', filename='styles.css') }}">
<style>
html, body {
height: 100%;
}
body {
display: flex;
align-items: center;
justify-content: center;
}
</style>
</head>
<body>
<div>
<div>
<h1>{{ title }}</h1>
<img src="data:image/png;base64,{{ plot_url }}" alt="Chart">
</div>
<div class="navigation">
<a href="{{ url_for('show_chart', chart_id=prev_id) }}">&#8592; Previous</a>
<a href="{{ url_for('show_chart', chart_id=next_id) }}">Next &#8594;</a>
</div>
</div>
</body>
</html>