Newer
Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
\documentclass[9pt,hyperref,ngerman]{beamer}
\pdfpageattr {/Group << /S /Transparency /I true /CS /DeviceRGB>>}
%\usepackage{beramono}
%\usepackage{pxfonts}
\usepackage[euler-digits]{eulervm}
\usepackage{amsmath}
\usepackage{wasysym}
\usepackage{amsfonts}
\usepackage[ngerman]{babel}
\usepackage[utf8]{inputenc}
\usepackage{graphicx}
\usepackage{bbm} % for getting a nice 1
%\usepackage{animate}
%\usepackage[hyperfootnotes=false,pdfpagelabels,pagebackref,unicode]{hyperref}
%\usepackage[caption=false]{subfig}
\usepackage{placeins}
%\usepackage{tikz}
\usepackage{pstool}
\usepackage{bbold}
\usepackage{ulem}
\usepackage[T1]{fontenc}
\usepackage{biolinum}
\usepackage[T1]{fontenc}
\usepackage[caption=false, labelformat=empty]{subfig}
\pdfpageattr {/Group << /S /Transparency /I true /CS /DeviceRGB>>}
%For mac compatibility
%\graphicspath{{gfx/}}
%\graphicspath{{../gfx/}{./gfx/}}
\EndPreamble
\usetheme[unilogo=uniwue]{FOR1807} % nobody uses page numbers -> FakherMode
\pdfpageattr {/Group << /S /Transparency /I true /CS /DeviceRGB>>}
\newsavebox{\mytmpboxx}
% \img{<options>}{<basename>}{<psfrag code>}
%   #1 -- option list, handed to both \psfragfig* and \imgfade
%   #2 -- base name of the figure, without extension
%   #3 -- trailing argument of \psfragfig* (the replacement definitions)
% The figure is first run through \psfragfig* inside a scratch box that is
% never typeset; only the PDF produced as a side effect is of interest. That
% PDF is moved into gfx/ and then displayed through \imgfade.
% Requires shell escape (\write18) and a Unix-like `mv`.
% NOTE(review): \imgfade is not defined in this file; presumably it comes
% from the FOR1807 theme -- confirm.
% Every line of the body ends in `%' so that no stray space token ends up
% next to the figure when \img is used in horizontal mode.
\newcommand{\img}[3]{{%
  % to enable Fakher's mac...
  %\immediate\write18{cp ./gfx/#2.eps ./#2.eps}%
  \sbox{\mytmpboxx}{\psfragfig*[#1]{#2}{#3}}% create the pdf
  \immediate\write18{mv #2.pdf gfx/}%
  %\immediate\write18{rm #2.eps}
  %\sbox{\mytmpbox}{%load the resulting pdf
  \imgfade[#1]{#2}%
}}
% Two scratch length registers. Neither is used in the visible part of this file.
\newlength\templen
\newlength\temptwo
% Custom colour "Maroon", specified by its CMYK components.
\definecolor{Maroon}{cmyk}{0, 0.87, 0.68, 0.32}
% ---- Math shorthands -------------------------------------------------------
% \abs{x}: argument between vertical bars that are auto-sized by \left/\right.
\newcommand{\abs}[1]{\left| #1 \right|}
% Upright i, e and d.
% NOTE(review): presumably imaginary unit, Euler's number and the differential -- confirm.
\newcommand{\I}{ \mathrm{i} }
\newcommand{\E}{\mathrm{e}}
\newcommand{\D}{\mathrm{d}}
% Short names for the up and down arrows.
\newcommand{\up}{\uparrow}
\newcommand{\dw}{\downarrow}
% Upright operator names "Tr", "sgn" and "Res".
\DeclareMathOperator{\tr}{Tr}
\DeclareMathOperator{\sgn}{sgn}
\DeclareMathOperator{\Res}{Res}
% \mat{A}: bold upright symbol; \identity is a bold 1 built on top of it.
\newcommand{\mat}[1]{\mathbf{#1}}
\newcommand{\identity}{\mat{1}}
\newcommand{\matgr}[1]{\boldsymbol{#1}} % Typesets Greek letters that denote a matrix in bold.
% Bra/ket family. Each visible delimiter is paired with an invisible `.'
% partner around empty material, so the delimiters are not scaled to the
% argument; \! pulls the argument closer to the delimiters.
% The D and S variants append a text subscript "D" or "S".
% NOTE(review): the meaning of the D/S labels is not visible here -- confirm.
\newcommand{\dket}[1]{\left| \right. \! #1 \! \left. \right\rangle_\text{D}}
\newcommand{\dbra}[1]{\left\langle \right. \! #1 \! \left. \right|_\text{D}}
\newcommand{\sket}[1]{\left| \right. \! #1 \! \left. \right\rangle_\text{S}}
\newcommand{\sbra}[1]{\left\langle \right. \! #1 \! \left. \right|_\text{S}}
\newcommand{\ket}[1]{\left| \right. \! #1 \! \left. \right\rangle}
\newcommand{\bra}[1]{\left\langle \right. \! #1 \! \left. \right|}
% \thavg{x}: argument between angle brackets, built the same way as \bra/\ket.
\newcommand{\thavg}[1]{\left\langle \right. \! #1 \! \left. \right\rangle}
% changemargin{<left>}{<right>}
% Sets its contents inside a label-less list whose left and right margins are
% the two arguments. Paragraph indentation and paragraph spacing inside the
% environment are copied from the values in force outside, and no extra
% vertical space is added above or below.
\newenvironment{changemargin}[2]{%
  \begin{list}{}{%
    % Horizontal insets requested by the caller.
    \setlength\leftmargin{#1}%
    \setlength\rightmargin{#2}%
    % Keep the surrounding paragraph layout.
    \setlength\itemindent{\parindent}%
    \setlength\listparindent{\parindent}%
    \setlength\parsep{\parskip}%
    % No extra space around the list.
    \setlength\topsep{0pt}%
  }%
  \item[]%
}{%
  \end{list}%
}
% \definecolor{purple}{rgb}{0.6,0.,0.6}
% \definecolor{purple2}{rgb}{0.5,0.,0.5}
% \definecolor{darkgreen}{rgb}{0.0,0.5,0.0}
% \definecolor{firebrick}{rgb}{0.69,0.13,0.13}
%
%
% \definecolor{darkred}{rgb}{0.54,0.0,0.0}
% \definecolor{indigo}{rgb}{0.29,0.0,0.51}
% \definecolor{lightblue}{rgb}{0.9,0.9,1.}
% \definecolor{darkblue}{rgb}{0.0,0.0,0.5}
% Hook run at the start of every section: inserts a frame of its own that
% shows only the section heading, centred horizontally and pushed to the
% vertical middle by the two \vfill, in the font and foreground colour of the
% beamer "title" element.
\AtBeginSection[]{
  \begin{frame}
    \vfill
    \begin{center}
      \usebeamerfont{title}%
      \usebeamercolor[fg]{title}
      \insertsectionhead\par%
    \end{center}
    \vfill
  \end{frame}
}
% Title-page metadata; it is typeset by the \titlepage call in the first frame.
\author{Florian Goth, Christoph Brüning, Fakher Assaad}
\date{01. July 2021}
%\institute[Uni Würzburg]{Universit\"at W\"urzburg\\Institut f\"ur Theoretische Physik und Astrophysik}
% The optional argument is the short form of the institute.
\institute[SFB1170/ct.qmat]{Universität Würzburg\\Institut für Theoretische Physik und Astrophysik}
% The empty optional argument gives the talk an empty short title.
\title[]{Data Management in ct.qmat}
\subtitle{-- An overview/introduction --}
%\logo{\includegraphics[height=0.5cm]{uniwue.png}}
\begin{document}
\begin{frame}
\titlepage
\end{frame}
\begin{frame}
\frametitle{Cluster of Excellence ct.qmat}
\vspace{-2em}
\includegraphics[width=0.7\textwidth]{gfx/logo_transparent.png}
\vfill
\begin{itemize}
\item Two sites: Würzburg, Dresden
\item Diverse groups across theory and experiment
\item Established in 2019
\item Research: Novel topological materials, quantum magnetism, topological photonics, tailoring topological functionality.
\end{itemize}
\end{frame}
\begin{frame}
\frametitle{The original grant proposal (Jan. 2018)}
\small
Simulations/experiments are a cornerstone of good
scientific practice and are facilitated by data management solutions. Efficient data management makes it possible to document the workflow leading to published data and facilitates
open access (OA) publication forms where all primary material is accessible.
In addition, the many locations within the cluster render collaborative tools a necessity.
Bringing both requirements together we foresee the need for collaborative
data management solutions that use established tools from the community while
at the same time leveraging the latest in storage technology.
\begin{block}{What is important}
\begin{itemize}
\item Delocalized
\item Collecting Data
\item Working on Data
\end{itemize}
$\rightarrow$ \emph{Collaborative Data Management}
\end{block}
\begin{block}{Political/external Pressures}
\begin{itemize}
\item Open Access Policy of DFG
\item Increased pressure for proper data management plans from funders
\item Publishers require open access to certain data
\item Reproducibility
\end{itemize}
\end{block}
\end{frame}
\begin{frame}
\frametitle{Research Cycle}
\vspace{-2em}
\begin{center}
\includegraphics[width=0.8\textwidth]{gfx/Research_cycle}
\end{center}
\end{frame}
\begin{frame}
\frametitle{Data Cycle}
\begin{center}
\includegraphics[width=0.8\textwidth]{gfx/cyclerdm}
\end{center}
\end{frame}
\begin{frame}
\begin{block}{What do we have to build?}
$\rightarrow$ Structures/software that enable:
\begin{itemize}
\item collaborative decentralized work on data from various sources
\item long-term, flexible storage
\item in a way that enables the openness of the research cycle
\item makes analysis steps reproducible
\item and in a manner that satisfies expectations on data management plans
\item open, extensible infrastructure should enable flexible services on this long time scale
\end{itemize}
\end{block}
\end{frame}
\begin{frame}
\frametitle{ct.qmat Data Management Cluster (simplified)}
\begin{center}
\includegraphics[width=1.0\textwidth]{gfx/structure-simplified.pdf}
\end{center}
\end{frame}
\begin{frame}
% \frametitle{Mapping to the Research Cycle/Data Cycle}
% \begin{itemize}
% \item Planning/Organization <-> OSF.io/gitlab
% \item Data Generation <-> Measurement Devices/SuperComputers/Thinking
% \item Data Storage <-> via DataVerse into the object store
% \item Analysis <-> JupyterHub
% \item Publication <-> OSF.io / DataVerse / gitlab
% \item ReUse/Reproduce <-> JupyterHub
% \end{itemize}
% \vfill
\begin{block}{Summary}
\begin{itemize}
\item The full cycle is available in software on the web $\rightarrow$ Delocalized
\item Almost integrated
\item Researchers can publish projects at will $\rightarrow$ Full control
\item Any service can be executed on top of the basic infrastructure (Kubernetes + Object Store) $\rightarrow$ Flexible
\end{itemize}
\end{block}
\vfill
\begin{block}{Status}
\begin{itemize}
\item gitlab present for a long time and we work on onboarding scientists \CheckedBox
\item Set up Storage Cluster \CheckedBox
\item -> Set up Kubernetes
\item Connect gitlab
\item Add Services: DataVerse, elabFTW, JupyterHub/BinderHub, OSF.io
\end{itemize}
\end{block}
\end{frame}
\begin{frame}
\frametitle{Preservation Outlook}
\vspace{-2em}
\begin{block}{Notes}
\begin{itemize}
\item Infrastructure is all open source $\rightarrow$ No vendor lock-in.
\item The provided tools are all open source, hence researchers can set up open workflows with public tools.
\item We educate people about certain tools (software-carpentry.org) $\rightarrow$ Behavioural changes.
\item In a perfect world, workgroups have their whole structure in an ELN and hence the network can be made openly visible.
\item Data curators? Maybe for project based research?
\item But basically this structure is meant to be live.
\end{itemize}
\end{block}
\end{frame}
\begin{frame}
\frametitle{Last Slide}
\begin{block}{Ideas for the university}
\begin{itemize}
\item What happens to DFG-funded entities once their limited project duration has ended?
\item The associated infrastructure could be kept alive in read-only mode for the following 10 years $\rightarrow$ university guarantees, foundations.
\item open collaborative tools vs. Arbeitsrecht?
\item citable resources, DOIs?
\item Support for this infrastructure!
\end{itemize}
\end{block}
\begin{itemize}
\item Only a platform. Services/analysis need to be done by domain scientists.
\item But the quality of data and scripts is only as good as the knowledge of the scientists involved.
\item Quality of initial data needs to be kept high $\rightarrow$ FDM
\item Web-based research will necessitate the use of scripts. Their quality needs to be fostered $\rightarrow$ specialized research software engineers.
\end{itemize}
\end{frame}
\begin{frame}
\frametitle{ct.qmat Data Management Cluster (original)}
\begin{center}
\includegraphics[width=1.0\textwidth]{gfx/Structure.pdf}
\end{center}
\end{frame}
\begin{frame}
\begin{block}{Short Explanations}
\begin{itemize}
\item Object Store: Abstraction Layer for storage.
\item Kubernetes: Abstraction Layer for providing services controlled via software.
\item gitlab: feature-rich version control tool for software development.
\item DataVerse: Research Data Repository.
\item OSF.io: Open Science Framework; Integrated Platform for managing and sharing your research.
\item JupyterHub: A platform for providing computational environments.
\end{itemize}
\end{block}
\end{frame}
\begin{frame}
\includegraphics[width=1.0\textwidth]{gfx/dataverse_example.png}
\end{frame}
\begin{frame}
\includegraphics[width=1.0\textwidth]{gfx/jupyterlab.png}
\end{frame}
\begin{frame}
\includegraphics[width=1.0\textwidth]{gfx/osf_eln.png}
\end{frame}
\begin{frame}
\includegraphics[width=1.0\textwidth]{gfx/osf_labexample.png}
\end{frame}
\begin{frame}
\frametitle{Data Cycle}
\begin{center}
\includegraphics[width=0.8\textwidth]{gfx/cycleosf}
\end{center}
\end{frame}
\begin{frame}
\includegraphics[width=1.0\textwidth]{gfx/osf_addons.png}
\end{frame}
\end{document}