blob: 55832239edffea187ba3b401ac36e1819717433b (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
|
#!/usr/bin/env bash
#
# Download the ReachMee job list page and print one line per table row of
# the job list, with the cells of each row joined by " | ".
#
# Rows mentioning "Technical and Administrative staff" or
# "PhD Student Positions" are left out of the output.
#
# Requires GNU sed: the program below uses the 0,/re/ address form and \s.
# Output goes to stdout; the exit status is non-zero when the download fails.
set -euo pipefail

readonly url='https://web103.reachmee.com/ext/I003/304/main?site=5&validator=a72aeedd63ec10de71e46f8d91d0d57c&lang=UK'

# sed program, run with -n so that only the explicit "p" below emits output.
# Cells are collected in the hold space and flushed when a row closes.
readonly script='
# Skip everything up to and including the opening of the job list container.
0,/<div id="mainjoblist">/d
# Keep only the lines between <tbody> and </tbody>.
/<tbody>/,/<\/tbody>/!d
# End of a table row: flush the cells collected so far as one output line.
/<\/tr>/ {
  # Empty the pattern space, then swap: the hold space is reset for the
  # next row and the pattern space receives the collected cells.
  s/.*//
  x
  # Cells were appended one per line; join them on a single line.
  s/\n//g
  # Remove the separator that precedes the first cell.
  s/^ | //
  # Unwanted rows are dropped before printing.
  /Technical and Administrative staff/d
  /PhD Student Positions/d
  p
  d
}
# From here on only lines that open a table cell are of interest.
/<td>/!d
/^\s*<\/td>\s*$/d
# Cell opened and closed on the same line: keep the inner content only.
s|\s*<td>\(.*\)</td>\s*|\1|
# Deadline cell: keep the text of the hidden (display: none) span.
s|.*Application deadline:.*display:\s*none">\([^<]*\)</span>.*|\1|
# Job link cell: keep the link text only.
s|.*a href=.*reachmee.*/job.*job_id[^>]*>\([^<]*\)</a>.*|\1|
# Prefix the cell with the separator and append it to the hold space.
s/^/ | /
H
'

# -f makes curl exit non-zero on HTTP errors (>= 400) instead of passing the
# error page to sed; -sS keeps the progress meter off but still reports the
# failure on stderr. With pipefail the failure becomes the script status.
curl -fsS "$url" | sed -n "$script"
|