-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathgoogle-play.php
579 lines (541 loc) · 29.1 KB
/
google-play.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
<?php
/** Crawl information of a specific application in the Google Play Store
* @class GooglePlay
* @version 1.1.0
* @author Max Base & Izzy
* @copyright MIT https://github.com/BaseMax/GooglePlayWebServiceAPI/blob/master/LICENSE
* @log 2020-10-19 first release
* @log 2022-05-28 recent version
* @brief releases: 2020-10-19, 2020-10-25, 2020-10-29, 2020-10-30, 2020-12-05, 2020-12-06, 2020-12-07, 2020-12-10, 2022-05-28
* @webpage repository https://github.com/BaseMax/GooglePlayWebServiceAPI
**/
class GooglePlay {
private $debug = false; // toggle debug output
private $input = ''; // content retrieved from remote
private $lastError = '';
private $categories = []; // list of Google Play app categories
private $ua = ''; // UserAgent (default: none; currently used for debugging)
/** Turn debug mode on or off
* @method public setDebug
* @param bool debug turn debug mode on (true) or off (false)
*/
public function setDebug($debug) {
$this->debug = (bool) $debug;
}
/** Check whether debug mode is enabled
* @method public getDebug
* @return bool debug whether debug mode is turned on (true) or off (false)
*/
public function getDebug() {
return $this->debug;
}
/** set a specific user agent
* Currently, mostly for debug – to find out if a given UA would return details otherwise omitted
* @method public setUA
* @param string userAgent user agent to set
*/
public function setUA($userAgent) {
$this->ua = $userAgent;
}
/** get the currently set user agent
* @method public getUA
* @return string userAgent user which is currently set
*/
public function getUA($userAgent) {
return $this->ua;
}
/** Parse a given RegEx and return the match marked by '(?<content>)'
* @method protected getRegVal
* @param string regEx regular expression to parse
* @return string result match when found, null otherwise
*/
protected function getRegVal($regEx) {
preg_match($regEx, $this->input, $res);
if (isset($res["content"])) return trim($res["content"]);
else return null;
}
/** Create a stream context for file_get_contents
* @parameter optional string method method to use (default: GET)
* @parameter optional bool ignoreErrors whether to fetch the content even on failure status codes (default: false)
* @parameter optional string content content to send (mostly used for POST), empty for none (default)
* @parameter optional string header header variables to set (charset, cookies etc). Default: "Accept-Charset: UTF-8\r\n"
* @return resource streamContext
*/
protected function createStreamContext($method='GET', $ignoreErrors=false, $content='', $header="Accept-Charset: UTF-8\r\n") {
$opts = ['http' =>
[
'method' => strtoupper($method)
]
];
if ( !empty($this->ua) ) $opts['http']['user_agent'] = $this->ua;
if ( $ignoreErrors ) $opts['http']['ignore_errors'] = true;
if ( !empty($header) ) $opts['http']['header'] = $header;
if ( !empty($content) ) $opts['http']['content'] = $content;
return stream_context_create($opts);
}
/** Fetch app page from Google Play
* @method protected getApplicationPage
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @param optional string lang language for translations. Should be ISO 639-1 two-letter code. Default: en
* @param optional string loc locale, mainly for currency. Again two-letter, but uppercase
* @return bool success
*/
protected function getApplicationPage($packageName, $lang='en_US', $loc='US') {
$link = "https://play.google.com/store/apps/details?id=" . $packageName . "&hl=$lang&gl=$loc";
if ( ! $this->input = @file_get_contents($link,false,$this->createStreamContext()) ) {
$this->lastError = $http_response_header[0];
return false;
} else {
return true;
}
}
/** Dump the raw page content for debugging purposes
* @method public dump_raw
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @param optional string fileName basename of the files to write to, optionally with leading path (default: ${packageName}; extensions will be appended)
* @param optional string lang language for translations. Should be ISO 639-1 two-letter code. Default: en
* @param optional string loc locale, mainly for currency. Again two-letter, but uppercase
* @return bool success
*/
public function dump_raw($packageName, $fileName='', $lang='en_US', $loc='US') {
if ( empty($this->input) ) $this->getApplicationPage($packageName, $lang='en_US', $loc='US');
if ( empty($fileName) ) $fileName = $packageName;
file_put_contents("${fileName}.html", $this->input);
// also dump the protos
for ($i=0;$i<10;++$i) {
if ( $proto = json_decode( $this->getRegVal("/key: 'ds:${i}'. hash: '\d+'. data:(?<content>\[\[\[.+?). sideChannel: .*?\);<\/script/ims") ) ) {
file_put_contents("${fileName}_ds${i}.json", json_encode($proto, JSON_PRETTY_PRINT|JSON_UNESCAPED_SLASHES));
} elseif ( $proto = json_decode( $this->getRegVal("/key: 'ds:${i}'. hash: '\d+'. data:(?<content>\[\[.+?). sideChannel: .*?\);<\/script/ims") ) ) { // ds:3
file_put_contents("${fileName}_ds${i}.json", json_encode($proto, JSON_PRETTY_PRINT|JSON_UNESCAPED_SLASHES));
}
}
}
/** Obtain app version details
* @method public parseVersion
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @return array details on the app on success, details on the error otherwise
*/
public function parseVersion($packageName) {
$lang='en';
$version = sprintf("[IoIWBc,'[[null,[%s,7]]]',null,%s]", $packageName, $packageName);
$value = sprintf("[[%s]]", $version);
$freq = urlencode($value);
$context = $this->createStreamContext('POST',true,"f.req=$freq","Content-type: application/x-www-form-urlencoded;charset=utf-8\r\nReferer: https://play.google.com/\r\n");
if ( $proto = @file_get_contents('https://play.google.com/_/PlayStoreUi/data/batchexecute?hl=' . $lang, false, $context) ) { // proto_buf/JSON data
preg_match("!HTTP/1\.\d\s+(\d{3})\s+(.+)$!i", $http_response_header[0], $match);
$response_code = $match[1];
switch ($response_code) {
case '200' : // HTTP/1.0 200 OK
break;
case '400' : // echo "! No XHR for '$pkg'\n";
case '404' : // app no longer on play
default:
return ['packageName'=>$packageName, 'versionName'=>'', 'minimumSDKVersion'=>0, 'size'=>0, 'success'=>0, 'message'=>$http_response_header[0]];
break;
}
} else { // network error (e.g. "failed to open stream: Connection timed out")
return ['packageName'=>$packageName, 'versionName'=>'', 'minimumSDKVersion'=>0, 'size'=>0, 'success'=>0, 'message'=>'network error'];
}
$proto = preg_replace('!^\)]}.*?\n!','',$proto);
$verInfo = json_decode( json_decode($proto)[0][2] );
$values = [];
$message = '';
if ( gettype($verInfo) == 'NULL' ) { // happens rarely, but happens; on a subsequent call for the same package it might succeed (temp hick-up?)
return ['packageName'=>$packageName, 'versionName'=>'', 'minimumSDKVersion'=>0, 'size'=>0, 'success'=>0, 'message'=>'Google returned no version info'];
} else {
$values['packageName'] = $packageName;
$values['versionName'] = $verInfo[1];
$values['minimumSDKVersion'] = $verInfo[2];
$values['size'] = $verInfo[0];
$values['success'] = 1;
$values['message'] = $message;
}
return $values;
}
/** Obtain details on a given app
* @method public parseApplication
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @param optional string lang language for translations. Should be ISO 639-1 two-letter code. Default: en
* @param optional string loc locale, mainly for currency. Again two-letter, but uppercase
* @return array details on the app on success, details on the error otherwise
* @verbatim
* On error, the array contains 2 keys: success=0 and message=(tring with reason)
* Success is signaled by success=1, and details are given via the keys
* packageName, name, developer, category, type (game, app, family), description,
* icon, images (array of screenshot URLs), updated, version, require (min Android version),
* install (number of installs), age, rating (float), votes, price, size,
* ads (has ads: 0|1), iap (in-app-payment used: 0|1)
* if not explicitly specified otherwise, values are strings
*/
public function parseApplication($packageName, $lang='en_US', $loc='US') {
if ( ! $this->getApplicationPage($packageName, $lang, $loc) ) {
return ['success'=>0,'message'=>$this->lastError];
}
$values = [];
$message = '';
$verInfo = $this->parseVersion($packageName);
if ( $verInfo['success'] != 1 ) $verInfo = ['size'=>0, 'minimumSDKVersion'=>0, 'versionName'=>''];
$values["packageName"] = $packageName;
$values["name"] = strip_tags($this->getRegVal('/itemprop="name">(?<content>.*?)<\/h1>/'));
if ($values["name"]==null) {
return ['success'=>0, 'message'=>'No app data found'];
}
$values["developer"] = strip_tags($this->getRegVal('/href="\/store\/apps\/dev(eloper)*\?id=(?<id>[^\"]+)"([^\>]*|)>(\<span[^\>]*>)*(?<content>[^\<]+)(<\/span>|)<\/a>/i'));
$values["summary"] = strip_tags($this->getRegVal('/property="og:description" content="(?<content>[^\"]+)/i'));
$values["description"] = $this->getRegVal('/itemprop="description"[^\>]*><div class="bARER"[^\>]*>(?<content>.*?)<\/div><div class=/i');
if ( strtolower(substr($lang,0,2)) != 'en' ) { // Google sometimes keeps the EN description additionally, so we need to filter it out **TODO:** check if this still applies (2022-05-27)
if ($this->debug) echo "Original Description:\n" . $values["description"] . "\n\n";
$values["description"] = preg_replace('!.*?<div jsname="Igi1ac" style="display:none;">(.+)!ims', '$1', $values["description"]);
}
//$values["icon"] = $this->getRegVal('/<div class="JU1wdd"><div class="l8YSdd"><img src="(?<content>[^\"]+)"/i');
$values["icon"] = preg_replace('!(.*)=w\d+.*!i', '$1', $this->getRegVal('/<meta name="twitter:image" content="(?<content>[^\"]+)"/i'));
$values["featureGraphic"] = preg_replace('!(.*)=w\d+.*!i', '$1', $this->getRegVal('/<img class="oiEt0d" src="(?<content>[^\"]+)"/i'));
preg_match('/<div class="aoJE7e qwPPwf"([^\>]+|)>(?<content>.*?)<c-data/i', $this->input, $image);
if ( isset($image["content"]) ) {
preg_match_all('/<img data-src="(?<content>[^\"]+)"/i', $image["content"], $images);
if ( isset($images["content"]) && !empty($images["content"]) ) {
$values["images"] = $images["content"];
} else {
preg_match_all('/<img (class="[^\"]+")*src="[^"]*" srcset="(?<content>[^\s"]+)/i', $image["content"], $images);
if ( isset($images["content"]) ) {
$values["images"] = $images["content"];
} else {
$values["images"] = null;
}
}
} else {
$values["images"] = null;
}
if ( substr(strtolower($lang),0,2)=='en' ) {
$values["lastUpdated"] = strip_tags($this->getRegVal('/<div class="lXlx5">Updated on<\/div><div class="xg1aie">(?<content>.*?)<\/div><\/div>/i'));
$values["versionName"] = $verInfo['versionName'];
$values["minimumSDKVersion"] = $verInfo['minimumSDKVersion'];
$values["installs"] = strip_tags($this->getRegVal('/<div class="ClM7O">(?<content>[^\>]*?)<\/div><div class="g1rdde">Downloads<\/div>/i'));
$values["age"] = strip_tags($this->getRegVal('/<span itemprop="contentRating"><span>(?<content>.*?)<\/span><\/span>/i'));
$values["size"] = $verInfo['size'];
$values["video"] = $this->getRegVal('/<button aria-label="Play trailer".*?data-trailer-url="(?<content>[^\"]+?)"/i');
$values["whatsnew"] = $this->getRegVal('/<div class="SfzRHd"><div itemprop="description">(?<content>.*?)<\/div><\/div><\/section>/i');
$test = $this->getRegVal('/<span class="UIuSk">(?<content>\s*Contains ads\s*)<\/span>/i'); // <span class="UIuSk">Contains ads</span>
(empty($test)) ? $values["ads"] = 0 : $values["ads"] = 1;
$test = $this->getRegVal('/<span class="UIuSk">(?<content>\s*In-app purchases\s*)<\/span>/i'); // <span class="UIuSk">In-app purchases</span>
(empty($test)) ? $values["iap"] = 0 : $values["iap"] = 1;
} else {
$envals = $this->parseApplication($packageName);
foreach(["lastUpdated","versionName","minimumSDKVersion","installs","age","size"] as $val) $values[$val] = $envals[$val];
}
$values["rating"] = $this->getRegVal('/<div itemprop="starRating"><div class="TT9eCd"[^\>]*>(?<content>[^<]+)(<i class="[^\>]*>star<\/i>)*<\/div>/i');
$values["votes"] = $this->getRegVal('/<div class="g1rdde">(?<content>[^>]+) reviews<\/div>/i');
$values["price"] = $this->getRegVal('/<meta itemprop="price" content="(?<content>[^"]+)">/i');
// ld+json data, see https://github.com/BaseMax/GooglePlayWebServiceAPI/issues/22#issuecomment-1168397748
$d = new DomDocument();
@$d->loadHTML($this->input);
$xp = new domxpath($d);
$jsonScripts = $xp->query( '//script[@type="application/ld+json"]' );
$json = trim( @$jsonScripts->item(0)->nodeValue ); //
$data = json_decode($json,true);
if (isset($data['applicationCategory'])) {
$values["category"] = $data['applicationCategory'];
if ( substr($values["category"],0,5)=='GAME_' ) $values["type"] = "game";
elseif ( substr($values["category"],0,7)=='FAMILY?' ) $values["type"] = "family";
else $values["type"] = "app";
$cats = $this->parseCategories();
if ( $cats["success"] && !empty($cats["data"][$values["category"]]) ) $values["category"] = $cats["data"][$values["category"]]->name;
} else {
$values["category"] = null;
$values["type"] = null;
}
if ( empty($values["summary"]) && !empty($data["description"]) ) $values["summary"] = $data["description"];
if (isset($data["contentRating"])) $values["contentRating"] = $data["contentRating"];
else $values["contentRating"] = "";
if ( isset($data["aggregateRating"]) ) {
if ( !empty($data["aggregateRating"]["ratingValue"]) ) $values["rating"] = $data["aggregateRating"]["ratingValue"];
if ( !empty($data["aggregateRating"]["ratingCount"]) ) $values["votes"] = $data["aggregateRating"]["ratingCount"];
}
$proto = json_decode($this->getRegVal("/key: 'ds:5'. hash: '\d+'. data:(?<content>\[\[\[.+?). sideChannel: .*?\);<\/script/ims"));
if ( empty($values["featureGraphic"]) && !empty($proto[1][2][96][0][3][2]) ) $values["featureGraphic"] = $proto[1][2][96][0][3][2];
if ( empty($values["video"]) && !empty($proto[1][2][100][0][0][3][2]) ) $values["video"] = $proto[1][2][100][0][0][3][2];
if ( empty($values["summary"]) && !empty($proto[1][2][73][0][1]) ) $values["summary"] = $proto[1][2][73][0][1];
if ( empty($proto[1][2][69][1][0]) ) $values["developerEmail"] = ""; else $values["developerEmail"] = $proto[1][2][69][1][0];
if ( empty($proto[1][2][69][0][5][2]) ) $values["developerWebsite"] = ""; else $values["developerWebsite"] = $proto[1][2][69][0][5][2];
// reviews
$values["reviews"] = [];
if ( $proto = json_decode($this->getRegVal("/key: 'ds:8'. hash: '\d+'. data:(?<content>\[\[\[.+?). sideChannel: .*?\);<\/script/ims")) ) { // DataSource:7 = reviews
foreach($proto[0] as $rev) {
$r["review_id"] = $rev[0];
$r["reviewed_version"] = (isset($rev[10])) ? $rev[10] : '';
$r["review_date"] = isset($rev[5][0]) ? $rev[5][0] : '';
$r["review_text"] = isset($rev[4]) ? $rev[4] : '';
$r["stars"] = isset($rev[2]) ? $rev[2] : '';
$r["like_count"] = isset ($rev[6]) ? $rev[6] : '';
if ( isset($rev[9]) && !empty($rev[9]) ) {
$r["reviewer"] = [
"reviewer_id"=>$rev[9][0],
"name"=>$rev[9][1],
"avatar"=>$rev[9][3][0][3][2],
"bg_image"=>$rev[9][4][3][2]
];
} else $r["reviewer"] = [];
if ( empty($rev[7]) ) {
$r["reply"] = [];
} else {
$r["response"] = [
"responder_name"=>$rev[7][0],
"response_text"=>$rev[7][1],
"response_date"=>$rev[7][2][0]
];
}
$values["reviews"][] = $r;
}
$values["review_token"] = @$proto[1][1] ?: ''; // needed if we want to fetch more reviews later (not always set)
} else {
$values["review_token"] = '';
}
if ($this->debug) {
print_r($values);
}
$values['success'] = 1;
$values['message'] = $message;
return $values;
}
/** Obtain permissions for a given app
* @method public parsePerms
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @param optional string lang language for translations. Should be ISO 639-1 two-letter code. Default: en
* @return array permission on success, details on the error otherwise
* @verbatim
* On error, the array contains 2 keys: success=0 and message=(tring with reason)
* Success is signaled by success=1, and details are given via the keys
* * perms : array[0..n] of permissions as displayed on play.google.com (i.e. the permission descriptions); unique, no grouping.
* * grouped : array of permission groups as displayed on play.google.com. Keys are the group ids as defined there.
* keys in each group array are group_name (translated name of the permission group) and perms (array[0..n])
* These perms have numeric keys (0 and 1). 0 seems always to be empty, 1 holds the permission description.
*/
public function parsePerms($packageName, $lang='en') {
$context = $this->createStreamContext('POST', true, 'f.req=%5B%5B%5B%22xdSrCf%22%2C%22%5B%5Bnull%2C%5B%5C%22' . $packageName . '%5C%22%2C7%5D%2C%5B%5D%5D%5D%22%2Cnull%2C%221%22%5D%5D%5D',
"Content-type: application/x-www-form-urlencoded;charset=utf-8\r\nReferer: https://play.google.com/\r\n");
if ( $proto = @file_get_contents('https://play.google.com/_/PlayStoreUi/data/batchexecute?rpcids=xdSrCf&bl=boq_playuiserver_20201201.06_p0&hl=' . $lang . '&authuser&soc-app=121&soc-platform=1&soc-device=1&rt=c&f.sid=-8792622157958052111&_reqid=257685', false, $context) ) { // raw proto_buf data
preg_match("!HTTP/1\.\d\s+(\d{3})\s+(.+)$!i", $http_response_header[0], $match);
$response_code = $match[1];
switch ($response_code) {
case "200" : // HTTP/1.0 200 OK
break;
case "400" : // echo "! No XHR for '$pkg'\n";
case "404" : // app no longer on play
default:
return ['success'=>0, 'grouped'=>[], 'perms'=>[], 'message'=>$http_response_header[0]];
break;
}
} else { // network error (e.g. "failed to open stream: Connection timed out")
return ['success'=>0, 'grouped'=>[], 'perms'=>[], 'message'=>'network error'];
}
$perms = $perms_unique = [];
$json = preg_replace('!.*?(\[.+?\])\s*\d.*!ims', '$1', $proto);
$arr = json_decode(json_decode($json)[0][2]);
if (!empty($arr[0])) foreach ($arr[0] as $group) { // 0: group name, 1: group icon, 2: perms, 3: group_id
if (empty($group)) continue;
$perms[$group[3][0]] = ['group_name'=>$group[0], 'perms'=>$group[2]];
foreach($group[2] as $perm) $perms_unique[] = $perm[1];
}
if (!empty($arr[1])) {
$perms['misc'] = ['group_name'=>$arr[1][0][0], 'perms'=>$arr[1][0][2]];
foreach($arr[1][0][2] as $perm) $perms_unique[] = $perm[1];
}
if (!empty($arr[2])) {
if (array_key_exists('misc',$perms)) $perms['misc']['perms'] = array_merge($perms['misc']['perms'],$arr[2]);
elseif ( is_array ($arr[1]) && is_array($arr[1][0]) && !empty($arr[1][0][0]) ) $perms['misc'] = ['group_name'=>$arr[1][0][0], 'perms'=>$arr[2]];
else $perms['misc'] = ['group_name'=>'unknown', 'perms'=>$arr[2]]; // ProtoBuf broken for this app, e.g. com.achunt.weboslauncher (perms display broken on Play website itself)
foreach($arr[2] as $perm) $perms_unique[] = $perm[1];
}
return ['success'=>1, 'message'=>'', 'grouped'=>$perms, 'perms'=>array_unique($perms_unique)];
}
/** Parse page specified by URL for playstore links and extract package names
* @method public parse
* @param optional string link link to parse; if empty or not specified, defaults to 'https://play.google.com/apps'
* @param optional bool is_url whether the link passed is an url to fetch-and-parse (true, default) or a string just to parse (false)
* @return array array of package names
* @brief this mainly is a helper for all methods parsing for app links, like parseTopApps, parseSimilar etc.
*/
public function parse($link=null, $is_url=true) {
if ( $is_url ) {
if ($link == "" || $link == null) {
$link = "https://play.google.com/apps";
}
if ( ! $this->input = @file_get_contents($link,false,$this->createStreamContext()) ) {
$this->lastError = $http_response_header[0];
return [];
} else {
$this->lastError = ''; // reset
}
} else {
$input = $link;
}
preg_match_all('/href="\/store\/apps\/details\?id=(?<ids>[^\"]+)"/i', $input, $ids);
if ( isset($ids["ids"]) ) {
$ids = $ids["ids"];
$ids = array_values(array_unique($ids));
$values = $ids;
} else {
$values = [];
}
if ($this->debug) {
print_r($values);
}
return $values;
}
/** Obtain list of top apps
* @method public parseTopApps
* @param string category name of the category to parse
* @return array array of package names
*/
public function parseTopApps() {
$link = "https://play.google.com/store/apps/top";
$data = $this->parse($link);
if ( empty($this->lastError) ) return ['success'=>1, 'message'=>'', 'data'=>$data];
else return ['success'=>0, 'message'=>$this->lastError, 'data'=>$data];
}
/** Obtain list of newest apps
* @method public parseNewApps
* @param string category name of the category to parse
* @return array array of package names
*/
public function parseNewApps() {
$link = "https://play.google.com/store/apps/new";
$data = $this->parse($link);
if ( empty($this->lastError) ) return ['success'=>1, 'message'=>'', 'data'=>$data];
else return ['success'=>0, 'message'=>$this->lastError, 'data'=>$data];
}
/** Parse Play Store page for a given category and return package names
* use this::parseCategories to obtain a list of available categories
* @method public parseCategory
* @param string category id of the category to parse
* @return array array of package names
*/
public function parseCategory($category) {
$link = "https://play.google.com/store/apps/category/" . $category;
$data = $this->parse($link);
if ( empty($this->lastError) ) return ['success'=>1, 'message'=>'', 'data'=>$data];
else return ['success'=>0, 'message'=>$this->lastError, 'data'=>$data];
}
/** Obtain list of available categories.
* Definitions of all available categories are stored in categories.jsonl using
* [JSONL](https://en.wikipedia.org/wiki/JSONL) format. This method returns them
* as array of objects with the ID as key and the properties id, name, type.
* @method public parseCategories
* @return array array of categories to be used with e.g. this::parseCategory
* @see https://developers.apptweak.com/reference/google-play-store-categories
*/
public function parseCategories($force=false) {
if ( ! empty($this->categories) && ! $force ) ['success'=>1, 'message'=>'', 'data'=>$this->categories];
$catfile = __DIR__ . '/categories.jsonl';
if ( ! file_exists($catfile) ) return ['success'=>0, 'message'=>"Category definition file '$catfile' does not exist.", 'data'=>[]];
$this->categories = [];
foreach ( file($catfile) as $line ) {
$cat = json_decode($line);
$this->categories[$cat->id] = $cat;
}
return ['success'=>1, 'message'=>'', 'data'=>$this->categories];
}
/** Obtain list of similar apps
* @method public parseSimilar
* @param string packageName package name of the app to find similars for, e.g. 'com.example.app'
* @return array array of package names
*/
public function parseSimilar($packageName) {
if ( ! $this->getApplicationPage($packageName) )
return ['success'=>0, 'message'=>$this->lastError, 'data'=>[]];
$input = $this->getRegVal('!<h2 class="sv0AUd bs3Xnd">Similar</h2></a>(?<content>.+?)(<c-wiz jsrenderer="rx5H8d"|</aside>)!ims');
if ( empty($input) )
return ['success'=>1, 'message'=>'no data found', 'data'=>[]];
return ['success'=>1, 'message'=>'', 'data'=>$this->parse($input, false)];
}
/** Obtain list of other apps by same author
* @method public parseOthers
* @param string packageName package name of the app to find similars for, e.g. 'com.example.app'
* @return array array of package names
*/
public function parseOthers($packageName) {
if ( ! $this->getApplicationPage($packageName) )
return ['success'=>0, 'message'=>$this->lastError, 'data'=>[]];
$input = $this->getRegVal('!<h2 class="sv0AUd bs3Xnd">More by [^<]*</h2></a></div><div class="W9yFB">(?<content>.+?)</c-data></c-wiz></div></div></div><script!ims');
if ( empty($input) )
return ['success'=>1, 'message'=>'no data found', 'data'=>[]];
return ['success'=>1, 'message'=>'', 'data'=>$this->parse($input, false)];
}
/** Search for apps by a given string
* @method public parseSearch
* @param string query string to search for
* @return array array of package names
*/
public function parseSearch($query) {
$link = "https://play.google.com/store/search?q=". urlencode($query) ."&c=apps";
$data = $this->parse($link);
if ( empty($this->lastError) ) {
if ( empty($data) ) return ['success'=>1, 'message'=>'no data found', 'data'=>$data];
else return ['success'=>1, 'message'=>'', 'data'=>$data];
}
else return ['success'=>0, 'message'=>$this->lastError, 'data'=>$data];
}
/* Obtain Data Safety details for a given app
* @method public parsePrivacy
* @param string packageName identifier for the app, e.g. 'com.example.app'
* @param optional string lang language for translations. Should be ISO 639-1 two-letter code. Default: en
* @return array privacy details on the app on success, details on the error otherwise
*/
public function parsePrivacy($packageName, $lang='en') {
$link = sprintf('https://play.google.com/store/apps/datasafety?id=%s&hl=%s', $packageName, $lang);
if ( $this->input = @file_get_contents($link,false,$this->createStreamContext()) ) {
preg_match("!HTTP/1\.\d\s+(\d{3})\s+(.+)$!i", $http_response_header[0], $match);
$response_code = $match[1];
switch ($response_code) {
case "200" : // HTTP/1.0 200 OK
break;
case "400" : // echo "! No XHR for '$pkg'\n";
case "404" : // app no longer on play
default:
$this->lastError = $http_response_header[0];
return ['success'=>0, 'values'=>[], 'message'=>$http_response_header[0]];
break;
}
} else { // network error (e.g. "failed to open stream: Connection timed out")
$this->lastError = 'network error';
return ['success'=>0, 'values'=>[], 'message'=>'network error'];
}
$doc = new DOMDocument();
@$doc->loadHTML($this->input);
$xp = new DOMXPath($doc);
$nlh = $xp->query("//div[@class='Mf2Txd']/h2"); // node list of headers
if ($this->debug) echo "Privacy sections: ".$nlh->length."\n";
$sections = [];
foreach($nlh as $section) {
$sname = trim ($section->nodeValue);
$node = $section->nextSibling;
$desc = ''; $extras = [];
switch ( $node->getAttribute('class') ) {
case 'ivTO9c': $desc = $node->firstChild->textContent; break;
case 'XgPdwe':
$desc = 'see extras';
foreach ($node->childNodes as $child) {
$ex = $child->firstChild->nextSibling->firstChild; // the extra detail's header
$eh = $ex->nodeValue;
$ex = $ex->nextSibling; // the extra's details
$ed = $ex->nodeValue;
$extras[] = ['name'=>$eh, 'desc'=>$ed];
}
break;
default: if ($this->debug) echo "Got unknown class '". strtolower($node->getAttribute('class'))."' for section description\n"; break;
}
$node = $node->nextSibling;
if ( empty($extras) ) {
foreach ($node->childNodes as $child) {
$ex = $child->firstChild->firstChild->firstChild->firstChild->firstChild->nextSibling->firstChild; // the extra detail's header
$eh = $ex->nodeValue;
$ex = $ex->nextSibling; // the extra's details
$ed = $ex->nodeValue;
$extras[] = ['name'=>$eh, 'desc'=>$ed];
}
}
$sections[] = ['name'=>$sname, 'desc'=>$desc, 'extras' => $extras];
}
return ['success'=>1, 'values'=>$sections, 'message'=>''];
}
}