TL;DR; Most repos say they support both php5 and php7, but php7 only repos are growing. Most projects started with php5.3 in mind and are not compatible with lower versions.
I took the data from Github database on google cloud with BigQuery. This returned 114.113 php repositories that use composer.
Show the code
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
--get the data
SELECT
files.repo_name,
REGEXP_EXTRACT(contents.content,r'(.*["|\']php["|\'].*:.*)') AS version
FROM
[bigquery-public-data:github_repos.contents] AS contents
JOIN (
SELECT
path,
repo_name,
id
FROM
[bigquery-public-data:github_repos.files]
WHERE
path LIKE 'composer.json'
) AS files
ON
(contents.id == files.id)
WHERE
NOT binary
AND files.path LIKE "composer.json"
AND REGEXP_MATCH(contents.content,r'.*["|\']php["|\'].*:.*')
GROUP BY
files.repo_name,
version
From the distribution of php versions, we can see that most of them say that they support both php5 and php7. This has to be taken with a grain of salt because there are a lot of php5 repos that are not updated and were created before php7. The owners didn't bother inserting an upper limit:
Show the code
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
%matplotlib inline
data_all = pd.read_csv(
"data/php-github-versions/all.csv"
)
data_all_version_dummies = data_all["version"]\
.str.replace("|", ",")\
.str.replace('"',"")\
.str.replace("'","")\
.str.replace(" ","")\
.str.replace("\t","")\
.str.replace("\n","")\
.str.replace("-", ",")\
.str.get_dummies(sep=",")
data_all_version_dummies_cleaned = data_all_version_dummies.copy().drop(["DEV", "dev", "\xa0\xa0\xa0\xa0>=5.3.2", "<", "<="], axis=1)
any_5_version = ['^5', '^5.0', '^5.0.0', '5.*', '<5.7.0', '<6.0.0', '<7', '<7.0', '~5', '>=5', '>=5.0', '>=5.0.0', '>5.0', '>5.0.0', '>=5.0.5',
'>=5.0.2', '>=5.0.3', '>=5.0.1']
stuck_on_5_from_5_1 = ['^5.1']
stuck_on_5_from_5_2 = ['^5.2', '^5.2.4', '~5.2']
stuck_on_5_3 = ['5.3', '5.3.0', '5.3.10', '5.3.29', '5.3.3', '5.3.6', '5.3.8', '5.3.9', '<5.4', '~5.3.0', '~5.3.3', '~5.3.8']
stuck_on_5_from_5_3 = ['^5.3', '^5.3.0', '^5.3.10', '^5.3.2', '^5.3.3', '^5.3.5', '^5.3.6', '^5.3.9', '~5.3', '>=5.3.6<7.0.0', '>=5.3.9<7.0']
stuck_on_5_4 = ['5.4', '5.4.*', '5.4.0', '5.4.16', '5.4.37', '5.4.43', '5.4.45', '5.4.8', '<5.5', '~5.4.0', '~5.4.11', '=5.4.0', '=5.4.4']
stuck_on_5_from_5_4 = ['^5.4', '^5.4.0', '^5.4.25', '^5.4.3', '^5.4.37', '^5.4.4', '^5.4.7', '^5.4.8', '~5.4', '>=5.4.0<7.0.0', '>=5.4<7']
stuck_on_5_5 = ['5.5', '5.5.*', '5.5.0', '5.5.11', '5.5.12', '5.5.14', '5.5.33', '5.5.38', '5.5.5', '5.5.9', '5.5.x', '<5.6',
'~5.5.11', '~5.5.12', '~5.5.16', '~5.5.18', '~5.5.22', '~5.5.9', '~5.5.0', '<=5.5.10', '<=5.5.38']
stuck_on_5_from_5_5 = ['^5.5', '^5.5.0', '^5.5.10', '^5.5.11', '^5.5.12', '^5.5.14', '^5.5.16', '^5.5.3', '^5.5.6', '^5.5.9', '~5.5', '>=5.5<7.0',
'>=5.5.0<6.0']
stuck_on_5_6 = ['5.6', '5.6.*', '5.6.0', '5.6.11', '5.6.14', '5.6.16', '5.6.17', '5.6.24', '5.6.26', '5.6.3', '5.6.30', '5.6.31','5.6.8', '5.6.9',
'~5.6.0', '~5.6.1', '~5.6.10', '~5.6.12', '~5.6.19', '~5.6.3', '~5.6.30', '~5.6.5', '~5.6.7', '~5.6.9', '~5.6', '<5.7'
'^5.6', '^5.6.0', '^5.6.1', '^5.6.10', '^5.6.13', '^5.6.19', '^5.6.2', '^5.6.23', '^5.6.24', '^5.6.25', '^5.6.30', '^5.6.4', '^5.6.6',
'=5.6.16', '<=5.6.23', '<=5.6.99']
stuck_on_7_0 = ['7.0', '7.0.*', '7.0.0', '7.0.10', '7.0.15', '7.0.2', '7.0.4', '7.0.5', '7.0.6', '7.0.7', '7.0.x', '<7.1',
'~7.0.0', '~7.0.3', '~7.0.6', '~7.0.7', '~7.0.8', '~7.0.9', '>=7.0.2<=7.0.4']
only_7_1 = ['7.1', '7.1.*', '7.1.0', '7.1.1', '7.1.9', '7.1.x', '^7.1', '^7.1.0', '^7.1.1', '^7.1.3', '^7.1.4', '^7.1.8', '~7.1', '~7.1.0', '~7.1.1',
'>=7.1', '>=7.1.0', '>=7.1.0<.0', '>=7.1.1', '>=7.1.2', '>=7.1.3', '>=7.1.4', '>=7.1.5', '>=7.1.7', '>=7.1.8', '>7.1', '>7.1.0']
both_7_0_and_7_1 = ['7', '7.*', '7.*.*', '~7', '~7.0', '<7.2', '<7.2.0', '<7.3.0', '^7', '^7.0', '^7.0.0', '^7.0.1', '^7.0.10', '^7.0.16',
'^7.0.3', '^7.0.4', '^7.0.5', '^7.0.6', '^7.0.7', '^7.0.8', '^7.0.9', '^7.0<7.2', '>=7”', '>=7.0.3', '>=7.0.4', '>=7.0.6',
'>=7.0.7', '>=7.0.8', '>=7.0.9', '>=7.00.0', '>=7.0<7.2', '>=7.0<7.3', '>=7.0<=7.1', '>=7', '>=7.0', '>=7.0.0', '>=7.0.0<7.2',
'>=7.0.0<7.2.0', '>=7.0.1', '>=7.0.10', '>=7.0.10<7.2', '>=7.0.11', '>=7.0.12', '>=7.0.13', '>=7.0.14', '>=7.0.15', '>=7.0.2',
'<=7.1', '<=7.1.99', '>7', '>7.0', '>7.0.0', '>=5.7']
both_5_and_7_explicit = ['>=5.6<7.2', '>=5.6<=7.1', '>5.3.3<7.1', '>=5.6.19<7.2']
from_5_1_to_7_optimistic = ['>=5.1', '>=5.1.0', '>=5.1.2', '>=5.1.3', '>=5.1.6']
from_5_2_to_7_optimistic = ['>=5.2', '>=5.2.0', '>=5.2.1', '>=5.2.10', '>=5.2.11', '>=5.2.12', '>=5.2.14', '>=5.2.17', '>=5.2.2', '>=5.2.20',
'>=5.2.3', '>=5.2.4', '>=5.2.5', '>=5.2.6', '>=5.2.7', '>=5.2.8', '>=5.2.9','>5.2', '>5.2.4']
from_5_3_to_7_optimistic = ['>5.3', '>5.3.0', '>5.3.10', '>5.3.2', '>5.3.3', '>5.3.3<', '>5.3.8', '>5.3.9', '>=5.3', '>=5.3.*', '>=5.3.0',
'>=5.3.1', '>=5.3.10', '>=5.3.12', '>=5.3.13', '>=5.3.14', '>=5.3.15', '>=5.3.16', '>=5.3.17', '>=5.3.18', '>=5.3.19',
'>=5.3.2', '>=5.3.23', '>=5.3.24', '>=5.3.26', '>=5.3.27', '>=5.3.28', '>=5.3.29', '>=5.3.3', '>=5.3.3.', '>=5.3.3.3',
'>=5.3.4', '>=5.3.5', '>=5.3.6', '>=5.3.7', '>=5.3.8', '>=5.3.9', '>=5.3<']
from_5_4_to_7_optimistic = ['>=5.4', '>=5.4.0', '>=5.4.0<', '>=5.4.1', '>=5.4.10', '>=5.4.11', '>=5.4.12', '>=5.4.13', '>=5.4.14', '>=5.4.16',
'>=5.4.17', '>=5.4.19', '>=5.4.2', '>=5.4.20', '>=5.4.21', '>=5.4.22', '>=5.4.23', '>=5.4.24', '>=5.4.26', '>=5.4.27',
'>=5.4.28', '>=5.4.29', '>=5.4.3', '>=5.4.30', '>=5.4.31', '>=5.4.34', '>=5.4.35', '>=5.4.36', '>=5.4.37', '>=5.4.38',
'>=5.4.39', '>=5.4.4', '>=5.4.40', '>=5.4.41', '>=5.4.42', '>=5.4.43', '>=5.4.45', '>=5.4.5', '>=5.4.6', '>=5.4.7',
'>=5.4.8', '>=5.4.9', '>=5.4<', '>5.4', '>5.4.0', '>5.4.1', '>5.4.10', '>5.4.16']
from_5_5_to_7_optimistic = ['>=5.5.1', '>=5.5.10', '>=5.5.11', '>=5.5.12', '>=5.5.13', '>=5.5.14', '>=5.5.15', '>=5.5.16', '>=5.5.18', '>=5.5.19',
'>=5.5.2', '>=5.5.21', '>=5.5.23', '>=5.5.24', '>=5.5.29', '>=5.5.3', '>=5.5.30', '>=5.5.31', '>=5.5.32', '>=5.5.33',
'>=5.5.34', '>=5.5.36', '>=5.5.37', '>=5.5.38', '>=5.5.4', '>=5.5.5', '>=5.5.6', '>=5.5.8', '>=5.5.9',
'>=5.5', '>=5.5.', '>=5.5.*', '>=5.5.0', '>5.5', '>5.5.0', '>5.5.9']
from_5_6_to_7_optimistic = ['>=5.6', '>=5.6.*', '>=5.6.0', '>=5.6.1', '>=5.6.10', '>=5.6.11', '>=5.6.12', '>=5.6.13', '>=5.6.14', '>=5.6.15',
'>=5.6.16', '>=5.6.17', '>=5.6.18', '>=5.6.19', '>=5.6.2', '>=5.6.20', '>=5.6.21', '>=5.6.22', '>=5.6.23',
'>=5.6.24', '>=5.6.25', '>=5.6.26', '>=5.6.28', '>=5.6.29', '>=5.6.3', '>=5.6.30', '>=5.6.4', '>=5.6.4<',
'>=5.6.5', '>=5.6.6', '>=5.6.7', '>=5.6.8', '>=5.6.9', '>5.6', '>5.6.0', '>5.6.4']
stuck_on_4 = ['>=4', '>=4.0', '>=4.0.0', '>=4.0.4', '>=4.0.6', '>=4.1.0', '>=4.2', '>=4.2.0', '>=4.3', '>=4.3.0', '>=4.3.10', '>=4.3.2', '>=4.4.0',
'>=4.4.9', '>4.4.0']
final_stuck_on_4 = data_all_version_dummies_cleaned.filter(stuck_on_4, axis=1).sum().sum() # 71
final_from_5_6_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_6_to_7_optimistic, axis=1).sum().sum() # 6024
final_from_5_5_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_5_to_7_optimistic, axis=1).sum().sum() # 17030
final_from_5_4_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_4_to_7_optimistic, axis=1).sum().sum() # 25504
final_from_5_3_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_3_to_7_optimistic, axis=1).sum().sum() # 44096
final_from_5_2_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_2_to_7_optimistic, axis=1).sum().sum() # 10474
final_from_5_1_to_7_optimistic = data_all_version_dummies_cleaned.filter(from_5_1_to_7_optimistic, axis=1).sum().sum() # 276
final_both_5_and_7_explicit = data_all_version_dummies_cleaned.filter(both_5_and_7_explicit, axis=1).sum().sum() # 6
final_both_7_0_and_7_1 = data_all_version_dummies_cleaned.filter(both_7_0_and_7_1, axis=1).sum().sum() # 7776
final_only_7_1 = data_all_version_dummies_cleaned.filter(only_7_1, axis=1).sum().sum() # 1147
final_stuck_on_7_0 = data_all_version_dummies_cleaned.filter(stuck_on_7_0, axis=1).sum().sum() # 304
final_stuck_on_5_6 = data_all_version_dummies_cleaned.filter(stuck_on_5_6, axis=1).sum().sum() # 792
final_stuck_on_5_from_5_5 = data_all_version_dummies_cleaned.filter(stuck_on_5_from_5_5, axis=1).sum().sum() # 1326
final_any_5_version =data_all_version_dummies_cleaned.filter(any_5_version, axis=1).sum().sum() # 482
final_stuck_on_5_from_5_1 =data_all_version_dummies_cleaned.filter(stuck_on_5_from_5_1, axis=1).sum().sum() # 2
final_stuck_on_5_from_5_2 =data_all_version_dummies_cleaned.filter(stuck_on_5_from_5_2, axis=1).sum().sum() # 4
final_stuck_on_5_3 =data_all_version_dummies_cleaned.filter(stuck_on_5_3, axis=1).sum().sum() # 243
final_stuck_on_5_from_5_3 =data_all_version_dummies_cleaned.filter(stuck_on_5_from_5_3, axis=1).sum().sum() # 601
final_stuck_on_5_4 =data_all_version_dummies_cleaned.filter(stuck_on_5_4, axis=1).sum().sum() # 41
final_stuck_on_5_from_5_4 =data_all_version_dummies_cleaned.filter(stuck_on_5_from_5_4, axis=1).sum().sum() # 574
final_stuck_on_5_5 =data_all_version_dummies_cleaned.filter(stuck_on_5_5, axis=1).sum().sum() # 248
# 4313
stuck_on_5 = final_stuck_on_5_6 + final_stuck_on_5_from_5_5 + final_any_5_version + final_stuck_on_5_from_5_1 + final_stuck_on_5_from_5_2 + final_stuck_on_5_3 + final_stuck_on_5_from_5_3 + final_stuck_on_5_4 + final_stuck_on_5_from_5_4 + final_stuck_on_5_5
# 9227
only_7 = final_both_7_0_and_7_1 + final_only_7_1 + final_stuck_on_7_0
# 103410
both_5_and_7 = final_both_5_and_7_explicit+final_from_5_6_to_7_optimistic +final_from_5_5_to_7_optimistic+final_from_5_4_to_7_optimistic+final_from_5_3_to_7_optimistic+final_from_5_2_to_7_optimistic+final_from_5_1_to_7_optimistic
final_all = 118359
def make_autopct(values):
def my_autopct(pct):
total = sum(values)
val = int(round(pct*total/100.0))
return '{p:.2f}% ({v:,})'.format(p=pct,v=val)
return my_autopct
labels = 'Stuck on php 5', 'Only php 7', 'Other', 'Both php 5 and 7'
sizes = [stuck_on_5, only_7, final_all - stuck_on_5 - only_7 - both_5_and_7, both_5_and_7]
explode = (0, 0, 0, 0)
fig1, ax1 = plt.subplots(figsize=(12,12))
ax1.pie(sizes, explode=explode, labels=labels, autopct=make_autopct(sizes),
shadow=True, startangle=120)
ax1.axis('equal')
plt.title("Distribution of PHP versions on github from main composer.json files")
plt.figure(figsize=(10,10))
fig1.savefig("data/php-github-versions/5vs7.png")
plt.show()
From the repos that say they work both on versions 5 and 7, most of them were started with php 5.3 in mind.
Show the code
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
labels = 'From 5.6 up', 'From 5.5 up', 'From 5.4 up', 'From 5.3 up', 'From 5.2 up', 'From 5.1 up'
sizes = [final_from_5_6_to_7_optimistic,
final_from_5_5_to_7_optimistic,
final_from_5_4_to_7_optimistic,
final_from_5_3_to_7_optimistic,
final_from_5_2_to_7_optimistic,
final_from_5_1_to_7_optimistic]
explode = (0, 0, 0, 0.05, 0, 0)
fig1, ax1 = plt.subplots(figsize=(12,12))
ax1.pie(sizes, explode=explode, labels=labels, autopct=make_autopct(sizes),
shadow=True, startangle=10)
ax1.axis('equal')
plt.title("Github repositories that work on both php5 and php7")
plt.figure(figsize=(10,10))
fig1.savefig("data/php-github-versions/both.png")
plt.show()
From the repos that work only on php7, most of them work on both 7.0 and 7.1, but there are 12% which adopted the 7.1 syntax features and are incompatible with 7.0:
Show the code
1
2
3
4
5
6
7
8
9
10
11
12
13
14
labels = 'Both 7.0 and 7.1', 'Only 7.1 and up', 'Only 7.0'
sizes = [final_both_7_0_and_7_1,
final_only_7_1,
final_stuck_on_7_0]
explode = (0, 0, 0)
fig1, ax1 = plt.subplots(figsize=(12,12))
ax1.pie(sizes, explode=explode, labels=labels, autopct=make_autopct(sizes),
shadow=True, startangle=10)
ax1.axis('equal')
plt.title("Github repositories that require php7 and up")
plt.figure(figsize=(10,10))
fig1.savefig("data/php-github-versions/php7.png")
plt.show()
From the repos that are stuck on php5, most of them started with php5.5 in mind and work with php5.6 too. Over 60% work on these 2 versions:
Show the code
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
labels = 'Only php5.6', 'php5.5<7', 'Any php5 version', 'php5.2<7', 'Only php5.3', 'Only php5.4', 'Only php5.5'
sizes = [final_stuck_on_5_6,
final_stuck_on_5_from_5_5,
final_any_5_version,
final_stuck_on_5_from_5_2,
final_stuck_on_5_3,
final_stuck_on_5_4,
final_stuck_on_5_5]
explode = (0, 0, 0, 0, 0, 0, 0)
fig1, ax1 = plt.subplots(figsize=(12,12))
ax1.pie(sizes, explode=explode, labels=labels, autopct=make_autopct(sizes),
shadow=True, startangle=10)
ax1.axis('equal')
plt.title("Github repositories that are stuck on php5")
plt.figure(figsize=(10,10))
plt.show()
plt.savefig("data/php-github-versions/php5.png")
Full code here.