-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathajax.php
73 lines (55 loc) · 2.01 KB
/
ajax.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
<?php
// Options for unicode
mb_language('uni');
mb_internal_encoding('UTF-8');
// Figure out which method we want
$task = $_GET["task"];
// This is a bit simple, but what the heck, I'm coding php...
switch ($task) {
case 'abstract':
$output = get_abstract();
break;
default:
$output = "Task not recognized";
break;
}
// Echo out whatever output we got
echo $output;
// Function which fetches an abstract
function get_abstract() {
// Get ID
$id = $_GET["id"];
$file = "data/".$id.".abstract.txt";
// Make sure we have sufficient zeros in front
for ($i = 0; $i < 10 && !file_exists( $file ); $i++)
$file = "data/".str_repeat("0",$i).$id.".abstract.txt";
// Now get contents (which are formatted as UTF-16)
$content = file_get_contents($file, FILE_TEXT);
$content = mb_convert_encoding($content, "UTF-16");
$content = utf8_urldecode($content);
$abstract = htmlentities(substr($content,18,-1));
// Do a bit of work on the abstract
$wrong = array(); $right = array();
$wrong[] = "û"; $right[] = "fi"; // fi ligature
$wrong[] = ""d"; $right[] = "≤"; // fi ligature
$wrong[] = "ï¬"; $right[] = "fi"; // fi ligature
$wrong[] = "≤"; $right[] = "≤"; // fi ligature
$wrong[] = "º"; $right[] = "κ"; // fi ligature
$wrong[] = "´"; $right[] = "δ"; // fi ligature
$wrong[] = ""¥"; $right[] = "⊥"; // fi ligature
$wrong[] = ""H"; $right[] = "≈"; // fi ligature
$wrong[] = """; $right[] = "♣"; // fi ligature
$wrong[] = "³"; $right[] = "γ"; // fi ligature
$wrong[] = "Á"; $right[] = "ρ"; // fi ligature
$wrong[] = "Ä"; $right[] = "τ"; // fi ligature
$wrong[] = "»"; $right[] = "λ"; // fi ligature
$abstract = str_replace($wrong, $right, $abstract);
// Return the abstract
return $abstract;
}
function utf8_urldecode($str) {
$str = str_replace("\\00", "%u00", $str);
$str = preg_replace("/%u([0-9a-f]{3,4})/i","&#x\\1;",urldecode($str));
return $str;
}
?>