forked from hpcugent/vsc_user_docs
-
Notifications
You must be signed in to change notification settings - Fork 0
/
glossary.tex
206 lines (206 loc) · 10.5 KB
/
glossary.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
\newglossaryentry{cluster}
{
name={cluster},
description={A group of compute nodes},
}
\newglossaryentry{compute-node}
{
name={compute node},
description={The computational units on which batch or interactive jobs are processed. A compute node is pretty much comparable to a single personal computer. It contains one or more sockets, each holding a single CPU. Some nodes also contain one or more GPGPUs. The compute node is equipped with memory (RAM) that is accessible by all its CPUs},
}
\newglossaryentry{core}
{
name={core},
description={An individual compute unit inside a CPU. A CPU typically contains one or more cores},
}
\newglossaryentry{CPU}
{
name={CPU},
description={A central processing unit. A CPU is a consumable resource. A compute node typically contains one or more CPUs},
}
\newglossaryentry{distributed-memory-system}
{
name={distributed memory system},
description={Computing system consisting of many compute nodes connected by a network, each with their own memory. Accessing memory on a neighbouring node is possible but requires explicit communication},
}
\newglossaryentry{FLOPS}
{
name={FLOPS},
description={FLOPS is short for ``Floating-point Operations Per second'', i.e., the number of (floating-point) computations that a processor can perform per second},
}
\newglossaryentry{FTP}
{
name={FTP},
description={File Transfer Protocol, used to copy files between distinct machines (over a network.) FTP is unencrypted, and as such blocked on certain systems. SFTP or SCP are secure alternatives to FTP},
}
\newglossaryentry{GPGPU}
{
name={GPGPU},
description={A general purpose graphical processing unit. A GPGPU is a consumable resource. A GPGPU is a GPU that is used for highly parallel general purpose calculations. A compute node may contain zero, one or more GPGPUs},
}
\newglossaryentry{grid}
{
name={grid},
description={A group of clusters},
}
\newglossaryentry{HPC}
{
name={HPC},
description={High Performance Computing, high performance computing and multiple-task computing on a supercomputer. The \hpcInfra is the HPC infrastructure at the \university},
}
\newglossaryentry{L1d}
{
name={L1d},
description={Level 1 data cache, often called \textbf{primary cache}, is a static memory integrated with the CPU core that is used to store data recently accessed by a CPU and also data which may be required by the next operations},
}
\newglossaryentry{L2d}
{
name={L2d},
description={Level 2 data cache, also called \textbf{secondary cache}, is a memory that is used to store recently accessed data and also data, which may be required for the next operations. The goal of having the level 2 cache is to reduce data access time in cases when the same data was already accessed before.},
}
\newglossaryentry{L3d}
{
name={L3d},
description={Level 3 data cache. Extra cache level built into motherboards between the microprocessor and the main memory},
}
\newglossaryentry{LLC}
{
name={LLC},
description={The Last Level Cache is the last level in the memory hierarchy before main memory. Any memory requests missing here must be serviced by local or remote DRAM, with significant increase in latency when compared with data serviced by the cache memory},
}
\newglossaryentry{InfiniBand}
{
name={InfiniBand},
description={A high speed switched fabric computer network communications link used in \hpc},
}
\newglossaryentry{job-constraints}
{
name={job constraints},
description={A set of conditions that must be fulfilled for the job to start},
}
\newglossaryentry{LAN}
{
name={LAN},
description={Local Area Network},
}
\newglossaryentry{Linux}
{
name={Linux},
description={An operating system, similar to UNIX},
}
\newglossaryentry{login-node}
{
name={login node},
description={On \hpc clusters, login nodes serve multiple functions. From a login node you can submit and monitor batch jobs, analyse computational results, run editors, plots, debuggers, compilers, do housekeeping chores as adjust shell settings, copy files and in general manage your account. You connect to these servers when want to start working on the \hpcInfra},
}
\newglossaryentry{memory}
{
name={memory},
description={A quantity of physical memory (RAM). Memory is provided by compute nodes. It is required as a constraint or consumed as a consumable resource by jobs. Within Moab, memory is tracked and reported in megabytes (MB)},
}
\newglossaryentry{metrics}
{
name={metrics},
description={A measure of some property, activity or performance of a computer sub-system. These metrics are visualised by graphs in, e.g., Ganglia},
}
\newglossaryentry{Moab}
{
name={Moab},
description={Moab is a job scheduler, which allocates resources for jobs that are requesting resources},
}
\newglossaryentry{modules}
{
name={modules},
description={\hpc uses an open source software package called ``Environment Modules'' (Modules for short) which allows you to add various path definitions to your shell environment},
}
\newglossaryentry{MPI}
{
name={MPI},
description={MPI stands for Message-Passing Interface. It supports a parallel programming method designed for distributed memory systems, but can also be used well on shared memory systems},
}
\newglossaryentry{node}
{
name={node},
description={See \gls{compute-node}},
}
\newglossaryentry{node-attribute}
{
name={node attribute},
description={A node attribute is a non-quantitative aspect of a node. Attributes typically describe the node itself or possibly aspects of various node resources such as processors or memory. While it is probably not optimal to aggregate node and resource attributes together in this manner, it is common practice. Common node attributes include processor architecture, operating system, and processor speed. Jobs often specify that resources be allocated from nodes possessing certain node attributes},
}
\newglossaryentry{PBS-TORQUE}
{
name={PBS, TORQUE},
description={ or \strong{OpenPBS} are Open Source resource managers, which are responsible for collecting status and health information from compute nodes and keeping track of jobs running in the system. It is also responsible for spawning the actual executable that is associated with a job, e.g., running the executable on the corresponding compute node. Client commands for submitting and managing jobs can be installed on any host, but in general are installed and used from the Login nodes},
}
\newglossaryentry{processor}
{
name={processor},
description={A processing unit. A processor is a consumable resource. A processor can be a CPU or a (GP)GPU},
}
\newglossaryentry{queue}
{
name={queue},
description={PBS/TORQUE queues, or ``classes'' as Moab refers to them, represent groups of computing resources with specific parameters. A queue with a 12 hour runtime or ``walltime'' would allow jobs requesting 12 hours or less to use this queue},
}
\newglossaryentry{scp}
{
name={scp},
description={Secure Copy is a protocol to copy files between distinct machines. SCP or scp is used extensively on \hpc clusters to stage in data from outside resources},
}
\newglossaryentry{scratch}
{
name={scratch},
description={Supercomputers generally have what is called scratch space: storage available for temporary use. Use the scratch filesystem when, for example you are downloading and uncompressing applications, reading and writing input/output data during a batch job, or when you work with large datasets. Scratch is generally a lot faster then the Data or Home filesystem},
}
\newglossaryentry{sftp}
{
name={sftp},
description={Secure File Transfer Protocol, used to copy files between distinct machines},
}
\newglossaryentry{shared-memory-system}
{
name={shared memory system},
description={Computing system in which all of the CPUs share one global memory space. However, access times from a CPU to different regions of memory are not necessarily uniform. This is called NUMA: Non-uniform memory access. Memory that is closer to the CPU your process is running on will generally be faster to access than memory that is closer to a different CPU. You can pin processes to a certain CPU to ensure they always use the same memory},
}
\newglossaryentry{SSD}
{
name={SSD},
description={Solid-State Drive. This is a kind of storage device that is faster than a traditional hard disk drive},
}
\newglossaryentry{SSH}
{
name={SSH},
description={Secure Shell (SSH), sometimes known as Secure Socket Shell, is a Unix-based command interface and protocol for securely getting access to a remote computer. It is widely used by network administrators to control Web and other kinds of servers remotely. SSH is actually a suite of three utilities (slogin, ssh, and scp) that are secure versions of the earlier UNIX utilities, rlogin, rsh, and rcp. SSH commands are encrypted and secure in several ways. Both ends of the client/server connection are authenticated using a digital certificate, and passwords are protected by encryption. Popular implementations include OpenSSH on Linux/Mac and Putty on Windows},
}
\newglossaryentry{ssh-keys}
{
name={ssh-keys},
description={OpenSSH is a network connectivity tool, which encrypts all traffic including passwords to effectively eliminate eavesdropping, connection hijacking, and other network-level attacks. SSH-keys are part of the OpenSSH bundle. On \hpc clusters, ssh-keys allow password-less access between compute nodes while running batch or interactive parallel jobs},
}
\newglossaryentry{supercomputer}
{
name={supercomputer},
description={A computer with an extremely high processing capacity or processing power},
}
\newglossaryentry{swap-space}
{
name={swap space},
description={A quantity of virtual memory available for use by batch jobs. Swap is a consumable resource provided by nodes and consumed by jobs},
}
\newglossaryentry{TLB}
{
name={TLB},
description={Translation Look-aside Buffer, a table in the CPU's memory that contains information about the virtual memory pages the CPU has accessed recently. The table cross-references a program's virtual addresses with the corresponding absolute addresses in physical memory that the program has most recently used. The TLB enables faster computing because it allows the address processing to take place independent of the normal address-translation pipeline},
}
\newglossaryentry{walltime}
{
name={walltime},
description={Walltime is the length of time specified in the job script for which the job will run on a batch system, you can visualise walltime as the time measured by a wall mounted clock (or your digital wrist watch). This is a computational resource},
}
\newglossaryentry{worker-node}
{
name={worker node},
description={See \gls{compute-node}},
}
\input{glossary_cloud}