-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpypi.go
120 lines (103 loc) · 3.77 KB
/
pypi.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
package cheerio
import (
"fmt"
"io/ioutil"
"net/http"
"path/filepath"
"regexp"
"strings"
"github.com/beyang/cheerio/fetch"
"github.com/beyang/go-version"
)
var DefaultPyPI = &PackageIndex{URI: "https://pypi.python.org"}
type PackageIndex struct {
URI string
}
// Get names of all packages served by a PyPI server.
func (p *PackageIndex) AllPackages() ([]string, error) {
pkgs := make([]string, 0)
resp, err := http.Get(fmt.Sprintf("%s/simple", p.URI))
if err != nil {
return nil, err
}
defer resp.Body.Close()
body, err := ioutil.ReadAll(resp.Body)
if err != nil {
return nil, err
}
matches := allPkgRegexp.FindAllStringSubmatch(string(body), -1)
for _, match := range matches {
if len(match) != 3 {
return nil, fmt.Errorf("Unexpected number of submatches: %d, %v", len(match), match)
} else if match[1] != match[2] {
return nil, fmt.Errorf("Names do not match %s != %s", match[1], match[2])
} else {
pkgs = append(pkgs, match[1])
}
}
return pkgs, nil
}
var requiresTxtTarPattern = regexp.MustCompile(`(?:[^/]+/)*(?:[^/]*\.egg\-info/requires\.txt)`)
var requiresTxtEggPattern = regexp.MustCompile(`EGG\-INFO/requires\.txt`)
var requiresTxtZipPattern = requiresTxtTarPattern
// Fetches package requirements from PyPI by downloading the package archive and extracting the requires.txt file. If no such file exists (sometimes
// it doesn't), returns an error.
func (p *PackageIndex) FetchPackageRequirements(pkg string) ([]*Requirement, error) {
b, err := p.FetchRawMetadata(pkg, requiresTxtTarPattern, requiresTxtEggPattern, requiresTxtZipPattern)
if err != nil {
if strings.Contains(err.Error(), "[no-files]") { // may not have a requires.txt
return nil, nil
} else {
return nil, err
}
}
return ParseRequirements(string(b))
}
func (p *PackageIndex) FetchRawMetadata(pkg string, tarPattern, eggPattern, zipPattern *regexp.Regexp) ([]byte, error) {
files, err := p.pkgFiles(pkg)
if err != nil {
return nil, err
} else if len(files) == 0 {
return nil, fmt.Errorf("[no-files] no files found for pkg %s", pkg)
}
// Sort files in version order
version.Sort(files)
// Get the latest version
if path := lastTar(files); path != "" {
return fetch.RemoteDecompress(fmt.Sprintf("%s%s", p.URI, path), tarPattern, fetch.Tar)
} else if path := lastEgg(files); path != "" {
return fetch.RemoteDecompress(fmt.Sprintf("%s%s", p.URI, path), eggPattern, fetch.Zip)
} else if path := lastZip(files); path != "" {
return fetch.RemoteDecompress(fmt.Sprintf("%s%s", p.URI, path), zipPattern, fetch.Zip)
} else {
return nil, fmt.Errorf("[tar/zip] no tar or zip found in %+v for pkg %s", files, pkg)
}
}
var allPkgRegexp = regexp.MustCompile(`<a href='([A-Za-z0-9\._\-]+)'>([A-Za-z0-9\._\-]+)</a><br/>`)
var pkgFilesRegexp = regexp.MustCompile(`<a href="([/A-Za-z0-9\._\-]+)#md5=[0-9a-z]+"[^>]*>([A-Za-z0-9\._\-]+)</a><br/>`)
var requirementRegexp = regexp.MustCompile(`(?P<package>[A-Za-z0-9\._\-]+)(?:\[([A-Za-z0-9\._\-]+)\])?\s*(?:(?P<constraint>==|>=|>|<|<=)\s*(?P<version>[A-Za-z0-9\._\-]+)(?:\s*,\s*[<>=!]+\s*[a-z0-9\.]+)?)?`)
var reqHeaderRegexp = regexp.MustCompile(`\[[A-Za-z0-9\._\-]+\]`)
// Helpers
func (p *PackageIndex) pkgFiles(pkg string) ([]string, error) {
files := make([]string, 0)
uriPath := fmt.Sprintf("/simple/%s", pkg)
uri := fmt.Sprintf("%s%s", p.URI, uriPath)
resp, err := http.Get(uri)
if err != nil {
return nil, err
}
defer resp.Body.Close()
body, err := ioutil.ReadAll(resp.Body)
if err != nil {
return nil, err
}
matches := pkgFilesRegexp.FindAllStringSubmatch(string(body), -1)
for _, match := range matches {
if len(match) != 3 {
return nil, fmt.Errorf("Unexpected number of submatches: %d, %v", len(match), match)
} else {
files = append(files, filepath.Clean(filepath.Join(uriPath, match[1])))
}
}
return files, nil
}