github_search_for_jni: really execute contracts
[nit.git] / contrib / github_search_for_jni / src / github_search_for_jni.nit
1 # This file is part of NIT ( http://www.nitlanguage.org ).
2 #
3 # Copyright 2014 Alexis Laferrière <alexis.laf@xymus.net>
4 #
5 # Licensed under the Apache License, Version 2.0 (the "License");
6 # you may not use this file except in compliance with the License.
7 # You may obtain a copy of the License at
8 #
9 # http://www.apache.org/licenses/LICENSE-2.0
10 #
11 # Unless required by applicable law or agreed to in writing, software
12 # distributed under the License is distributed on an "AS IS" BASIS,
13 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 # See the License for the specific language governing permissions and
15 # limitations under the License.
16
17 # Script to scan Github for repositories possibly using JNI.
18 module github_search_for_jni
19
20 import github_api
21
22 # The proprieties introduced by this redef are to be used only on HashMap
23 # representing a Github repository.
24 redef class HashMap[K, V]
25 # The repository has at least 50% Java code
26 fun has_lots_of_java: Bool
27 do
28 assert self isa HashMap[String, nullable Object]
29 var java_count = 0
30 if keys.has("Java") then java_count = self["Java"].as(Int)
31
32 if java_count == 0 then return false
33
34 var total = 0
35 for k, v in self do
36 assert v isa Int
37 total += v
38 end
39
40 return java_count * 100 / total > 50
41 end
42
43 # The repository has at least 100 lines of C code
44 fun has_some_c: Bool
45 do
46 assert self isa HashMap[String, nullable Object]
47 var c_count = 0
48 if keys.has("C") then c_count = self["C"].as(Int)
49 return c_count > 100
50 end
51 end
52
53 # Query sent to Github
54 var main_query = "language:java"
55
56 # Curl instance use for all requests
57 var curl = new GithubCurl("OAUTH TOKEN (replace with your own)", "JNI project finder (nitlanguage.org)")
58
59 if "NIT_TESTING".environ == "true" then exit 0
60
61 # Current requested page
62 var page = 0
63 var per_page = 100
64 loop
65 # Get a page of the main query
66 var uri = "https://api.github.com/search/repositories?q={main_query}&page={page}&per_page={per_page}&sort=stars"
67 var obj = curl.get_and_check(uri).as(HashMap[String, nullable Object])
68
69 # Main object has "total_count" and "items"
70 var items = obj["items"].as(Array[nullable Object])
71
72 # "items" is an array of Json objects
73 for item in items do
74 assert item isa HashMap[String, nullable Object]
75
76 # Each item has "name" and "languages_url"
77 assert item.keys.has("name")
78 assert item.keys.has("languages_url")
79
80 # Download the language list
81 var lang_url = item["languages_url"].as(String)
82 var langs = curl.get_and_check(lang_url).as(HashMap[String, nullable Object])
83
84 # The project is of interest if it has lots of Java and at least some C
85 var may_be_of_interest = langs.has_lots_of_java and langs.has_some_c
86 if may_be_of_interest then print "{item["name"].to_s}: {item["forks"].to_s}; {langs.keys.join(", ")}; {item["html_url"].to_s}"
87 end
88
89 # If we got less pages than asked for, we are done!
90 if items.length < per_page then break
91
92 page += 1
93 end