Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Analysis updates #2642

Merged
merged 8 commits into from
Sep 25, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
37 changes: 18 additions & 19 deletions Sources/App/Commands/Analyze.swift
Original file line number Diff line number Diff line change
Expand Up @@ -140,7 +140,7 @@ extension Analyze {

case .limit(let limit):
logger.info("Analyzing (limit: \(limit)) ...")
let packages = try await Package.fetchCandidates(database, for: .analysis, limit: limit).get()
let packages = try await Package.fetchCandidates(database, for: .analysis, limit: limit)
try await analyze(client: client,
database: database,
logger: logger,
Expand Down Expand Up @@ -339,7 +339,6 @@ extension Analyze {
url: package.model.url)
} catch {
logger.info("fetch failed: \(error.localizedDescription)")
logger.info("removing directory")
try await Current.shell.run(command: .removeFile(from: cacheDir, arguments: ["-r", "-f"]))
try await clone(logger: logger, cacheDir: cacheDir, url: package.model.url)
}
Expand Down Expand Up @@ -422,26 +421,26 @@ extension Analyze {
guard let defaultBranch = package.repository?.defaultBranch
.map({ Reference.branch($0) })
else {
throw AppError.genericError(package.model.id, "Package must have default branch - aborting analysis")
throw AppError.analysisError(package.model.id, "Package must have default branch")
}

do {
let tags = try await Current.git.getTags(cacheDir)

let references = [defaultBranch] + tags
return try await references
.mapAsync { ref in
let revInfo = try await Current.git.revisionInfo(ref, cacheDir)
let url = package.model.versionUrl(for: ref)
return try Version(package: package.model,
commit: revInfo.commit,
commitDate: revInfo.date,
reference: ref,
url: url)
}
} catch {
throw error
guard try await Current.git.hasBranch(defaultBranch, cacheDir) else {
throw AppError.analysisError(package.model.id, "Default branch '\(defaultBranch)' does not exist in checkout")
Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Add a check to handle this particular error. We may want to do an audit where we throw anything that isn't an AppError without an id - or simply ensure we wrap them all before we run updatePackages.

}

let tags = try await Current.git.getTags(cacheDir)

let references = [defaultBranch] + tags
return try await references
.mapAsync { ref in
let revInfo = try await Current.git.revisionInfo(ref, cacheDir)
let url = package.model.versionUrl(for: ref)
return try Version(package: package.model,
commit: revInfo.commit,
commitDate: revInfo.date,
reference: ref,
url: url)
}
}


Expand Down
6 changes: 5 additions & 1 deletion Sources/App/Commands/Common.swift
Original file line number Diff line number Diff line change
Expand Up @@ -43,7 +43,11 @@ func updatePackages(client: Client,
}
}
for result in results {
try await updatePackage(client: client, database: database, logger: logger, result: result, stage: stage)
do {
try await updatePackage(client: client, database: database, logger: logger, result: result, stage: stage)
} catch {
logger.critical("updatePackage failed: \(error)")
}
}

logger.debug("updateStatus ops: \(results.count)")
Expand Down
2 changes: 1 addition & 1 deletion Sources/App/Commands/Ingest.swift
Original file line number Diff line number Diff line change
Expand Up @@ -94,7 +94,7 @@ func ingest(client: Client,
packages: [pkg])
case .limit(let limit):
logger.info("Ingesting (limit: \(limit)) ...")
let packages = try await Package.fetchCandidates(database, for: .ingestion, limit: limit).get()
let packages = try await Package.fetchCandidates(database, for: .ingestion, limit: limit)
await ingest(client: client,
database: database,
logger: logger,
Expand Down
2 changes: 2 additions & 0 deletions Sources/App/Core/AppEnvironment.swift
Original file line number Diff line number Diff line change
Expand Up @@ -287,6 +287,7 @@ struct Git {
var firstCommitDate: (String) async throws -> Date
var lastCommitDate: (String) async throws -> Date
var getTags: (String) async throws -> [Reference]
var hasBranch: (Reference, String) async throws -> Bool
var revisionInfo: (Reference, String) async throws -> RevisionInfo
var shortlog: (String) async throws -> String

Expand All @@ -295,6 +296,7 @@ struct Git {
firstCommitDate: firstCommitDate(at:),
lastCommitDate: lastCommitDate(at:),
getTags: getTags(at:),
hasBranch: hasBranch(_:at:),
revisionInfo: revisionInfo(_:at:),
shortlog: shortlog(at:)
)
Expand Down
4 changes: 4 additions & 0 deletions Sources/App/Core/Extensions/ShellOutCommand+ext.swift
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,10 @@ extension ShellOutCommand {
.init(command: "git", arguments: ["log", "--max-parents=0", "-n1", #"--format=format:"%ct""#])
}

/// Builds the command used to check for a branch ref under `refs/heads/`.
///
/// The command is `git show-ref --verify --quiet refs/heads/<branch>`, where the
/// branch name is passed through `quoted` before being interpolated.
/// NOTE(review): `quoted` is defined outside this view - presumably it shell-quotes
/// the name; confirm it composes correctly inside the `refs/heads/` prefix.
///
/// - Parameter branch: Name of the branch to look up.
/// - Returns: The command value; nothing is executed here.
static func gitHasBranch(_ branch: String) -> Self {
.init(command: "git", arguments: ["show-ref", "--verify", "--quiet", "refs/heads/\(branch.quoted)"])
}

static var gitLastCommitDate: Self {
.init(command: "git", arguments: ["log", "-n1", #"--format=format:"%ct""#])
}
Expand Down
10 changes: 10 additions & 0 deletions Sources/App/Core/Git.swift
Original file line number Diff line number Diff line change
Expand Up @@ -63,6 +63,16 @@ extension Git {
.map { Reference.tag($0, $1) }
}

/// Reports whether `reference` names a branch for which the `gitHasBranch`
/// command succeeds in the checkout at `path`.
///
/// - Parameters:
///   - reference: The reference to check; references without a branch name yield `false`.
///   - path: Directory in which the git command is run.
/// - Returns: `true` if the command completes without throwing, `false` otherwise.
static func hasBranch(_ reference: Reference, at path: String) async throws -> Bool {
    // Only references that carry a branch name can match a branch.
    guard let name = reference.branchName else {
        return false
    }

    do {
        _ = try await Current.shell.run(command: .gitHasBranch(name), at: path)
    } catch {
        // Any failure of the command is reported as "branch not found".
        return false
    }
    return true
}

static func revisionInfo(_ reference: Reference, at path: String) async throws -> RevisionInfo {
let separator = "-"
let res = String(
Expand Down
4 changes: 2 additions & 2 deletions Sources/App/Models/Package.swift
Original file line number Diff line number Diff line change
Expand Up @@ -280,8 +280,8 @@ extension Package {

static func fetchCandidates(_ database: Database,
for stage: ProcessingStage,
limit: Int) -> EventLoopFuture<[Joined<Package, Repository>]> {
Joined.query(on: database)
limit: Int) async throws -> [Joined<Package, Repository>] {
try await Joined.query(on: database)
.filter(for: stage)
.sort(.sql(raw: "status != 'new'"))
.sort(\.$updatedAt)
Expand Down
1 change: 1 addition & 0 deletions Tests/AppTests/AnalyzeErrorTests.swift
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,7 @@ final class AnalyzeErrorTests: AppTestCase {
if checkoutDir.hasSuffix("foo-2") { return [.tag(1, 2, 3)] }
throw SetupError()
}
Current.git.hasBranch = { _, _ in true }
Current.git.revisionInfo = { ref, checkoutDir in
if checkoutDir.hasSuffix("foo-1") { return .init(commit: "commit \(ref)", date: .t1) }
if checkoutDir.hasSuffix("foo-2") { return .init(commit: "commit \(ref)", date: .t1) }
Expand Down
116 changes: 111 additions & 5 deletions Tests/AppTests/AnalyzerTests.swift
Original file line number Diff line number Diff line change
Expand Up @@ -157,7 +157,7 @@ class AnalyzerTests: AppTestCase {
// validation
let outDir = try checkoutDir.value.unwrap()
XCTAssert(outDir.hasSuffix("SPI-checkouts"), "unexpected checkout dir, was: \(outDir)")
XCTAssertEqual(commands.value.count, 34)
XCTAssertEqual(commands.value.count, 36)

// Snapshot for each package individually to avoid ordering issues when
// concurrent processing causes commands to interleave between packages.
Expand Down Expand Up @@ -251,6 +251,7 @@ class AnalyzerTests: AppTestCase {
Current.git.firstCommitDate = { _ in .t0 }
Current.git.lastCommitDate = { _ in .t2 }
Current.git.getTags = { _ in [.tag(1, 0, 0), .tag(1, 1, 1)] }
Current.git.hasBranch = { _, _ in true }
Current.git.revisionInfo = { ref, _ in
// simulate the following scenario:
// - main branch has moved from commit0 -> commit3 (timestamp t3)
Expand Down Expand Up @@ -311,6 +312,43 @@ class AnalyzerTests: AppTestCase {
XCTAssertEqual(versions.map(\.commit), ["commit1", "commit2", "commit3"])
}

/// Checks candidate selection before and after an analysis run that fails because
/// `hasBranch` reports the default branch as missing.
///
/// Expected progression, as asserted below:
/// - before analysis: 0 ingestion candidates, 1 analysis candidate
/// - right after analysis: 0 candidates for both stages
/// - once `Current.date` is shifted by `Constants.reIngestionDeadtime`: 1 ingestion
///   candidate, 0 analysis candidates
func test_forward_progress_on_analysisError() async throws {
// Ensure a package that fails analysis goes back to ingesting and isn't stuck in an analysis loop
// setup
do {
// A package saved with processing stage `.ingestion` plus a repository with default branch "main"
let pkg = try savePackage(on: app.db, "https://github.com/foo/1", processingStage: .ingestion)
try await Repository(package: pkg, defaultBranch: "main").save(on: app.db)
}

// Stub the git dependency; only `hasBranch` is set up to make analysis fail
Current.git.commitCount = { _ in 12 }
Current.git.firstCommitDate = { _ in .t0 }
Current.git.lastCommitDate = { _ in .t1 }
Current.git.hasBranch = { _, _ in false } // simulate analysis error via branch mismatch
Current.git.shortlog = { _ in "" }

// Ensure candidate selection is as expected
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .ingestion, limit: 10).count, 0)
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .analysis, limit: 10).count, 1)

// MUT
try await Analyze.analyze(client: app.client,
database: app.db,
logger: app.logger,
mode: .limit(10))

// Ensure candidate selection is now zero for analysis
// (and also for ingestion, as we're immediately after analysis)
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .ingestion, limit: 10).count, 0)
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .analysis, limit: 10).count, 0)

// Advance time beyond reIngestionDeadtime
// (the injected clock now returns the current time plus the deadtime on every call)
Current.date = { .now.addingTimeInterval(Constants.reIngestionDeadtime) }

// Ensure candidate selection has flipped to ingestion
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .ingestion, limit: 10).count, 1)
try await XCTAssertEqualAsync( try await Package.fetchCandidates(app.db, for: .analysis, limit: 10).count, 0)
}

func test_package_status() async throws {
// Ensure packages record success/error status
// setup
Expand All @@ -325,6 +363,7 @@ class AnalyzerTests: AppTestCase {
Current.git.firstCommitDate = { _ in .t0 }
Current.git.lastCommitDate = { _ in .t1 }
Current.git.getTags = { _ in [.tag(1, 0, 0)] }
Current.git.hasBranch = { _, _ in true }
Current.git.revisionInfo = { _, _ in .init(commit: "sha", date: .t0) }
Current.git.shortlog = { _ in
"""
Expand Down Expand Up @@ -435,7 +474,7 @@ class AnalyzerTests: AppTestCase {
mode: .limit(10))

// validation (not in detail, this is just to ensure command count is as expected)
XCTAssertEqual(commands.value.count, 38, "was: \(dump(commands.value))")
XCTAssertEqual(commands.value.count, 40, "was: \(dump(commands.value))")
// 1 packages with 2 tags + 1 default branch each -> 3 versions (the other package fails)
let versionCount = try await Version.query(on: app.db).count()
XCTAssertEqual(versionCount, 3)
Expand Down Expand Up @@ -494,9 +533,67 @@ class AnalyzerTests: AppTestCase {
XCTAssertEqual(repo?.authors, PackageAuthors(authors: [Author(name: "Person 1")], numberOfContributors: 1))
}

/// Verifies that `getIncomingVersions` returns a version for the default branch
/// and one for the reported tag.
func test_getIncomingVersions() async throws {
    // setup: the default branch exists and git reports a single tag
    Current.git.hasBranch = { _, _ in true }
    Current.git.getTags = { _ in [.tag(1, 2, 3)] }
    Current.git.revisionInfo = { reference, _ in
        .init(commit: "sha-\(reference)", date: .t0)
    }
    let package = Package(id: .id0, url: "1".asGithubUrl.url)
    try await package.save(on: app.db)
    try await Repository(id: .id1, package: package, defaultBranch: "main").save(on: app.db)
    let candidate = try await Package.fetchCandidate(app.db, id: .id0).get()

    // MUT
    let incoming = try await Analyze.getIncomingVersions(client: app.client,
                                                         logger: app.logger,
                                                         package: candidate)

    // validate (sorted, so the order of the returned versions does not matter)
    XCTAssertEqual(incoming.map(\.commit).sorted(), ["sha-1.2.3", "sha-main"])
}

/// Verifies that `getIncomingVersions` throws an `analysisError` carrying the package id
/// when `hasBranch` reports that the default branch is missing.
func test_getIncomingVersions_default_branch_mismatch() async throws {
    // setup
    Current.git.hasBranch = { _, _ in false }  // simulate branch mismatch
    let package = Package(id: .id0, url: "1".asGithubUrl.url)
    try await package.save(on: app.db)
    try await Repository(id: .id1, package: package, defaultBranch: "main").save(on: app.db)
    let candidate = try await Package.fetchCandidate(app.db, id: .id0).get()

    // MUT
    do {
        _ = try await Analyze.getIncomingVersions(client: app.client,
                                                  logger: app.logger,
                                                  package: candidate)
        XCTFail("expected an analysisError to be thrown")
    } catch let AppError.analysisError(.some(packageId), message) {
        // validate
        XCTAssertEqual(packageId, .id0)
        XCTAssertEqual(message, "Default branch 'main' does not exist in checkout")
    }
}

/// Verifies that `getIncomingVersions` throws an `analysisError` carrying the package id
/// when the package has no default branch.
func test_getIncomingVersions_no_default_branch() async throws {
    // setup
    // saving Package without Repository means it has no default branch
    let package = Package(id: .id0, url: "1".asGithubUrl.url)
    try await package.save(on: app.db)
    let candidate = try await Package.fetchCandidate(app.db, id: .id0).get()

    // MUT
    do {
        _ = try await Analyze.getIncomingVersions(client: app.client,
                                                  logger: app.logger,
                                                  package: candidate)
        XCTFail("expected an analysisError to be thrown")
    } catch let AppError.analysisError(.some(packageId), message) {
        // validate
        XCTAssertEqual(packageId, .id0)
        XCTAssertEqual(message, "Package must have default branch")
    }
}

func test_diffVersions() async throws {
//setup
Current.git.getTags = { _ in [.tag(1, 2, 3)] }
Current.git.hasBranch = { _, _ in true }
Current.git.revisionInfo = { ref, _ in
if ref == .branch("main") { return . init(commit: "sha.main", date: .t0) }
if ref == .tag(1, 2, 3) { return .init(commit: "sha.1.2.3", date: .t1) }
Expand Down Expand Up @@ -788,7 +885,7 @@ class AnalyzerTests: AppTestCase {
XCTAssertEqual(targets.map(\.type), [.regular, .executable])
}

func test_updatePackage() async throws {
func test_updatePackages() async throws {
// setup
let packages = try savePackages(on: app.db, ["1", "2"].asURLs)
.map(Joined<Package, Repository>.init(model:))
Expand Down Expand Up @@ -821,6 +918,7 @@ class AnalyzerTests: AppTestCase {
Current.git.firstCommitDate = { _ in .t0 }
Current.git.lastCommitDate = { _ in .t1 }
Current.git.getTags = { _ in [.tag(1, 0, 0), .tag(2, 0, 0)] }
Current.git.hasBranch = { _, _ in true }
Current.git.revisionInfo = { _, _ in .init(commit: "sha", date: .t0) }
Current.git.shortlog = { _ in
"""
Expand Down Expand Up @@ -879,7 +977,7 @@ class AnalyzerTests: AppTestCase {
// https://github.com/SwiftPackageIndex/SwiftPackageIndex-Server/issues/70
// setup
try savePackage(on: app.db, "1".asGithubUrl.url, processingStage: .ingestion)
let pkgs = try await Package.fetchCandidates(app.db, for: .analysis, limit: 10).get()
let pkgs = try await Package.fetchCandidates(app.db, for: .analysis, limit: 10)

let checkoutDir = Current.fileManager.checkoutsDirectory()
// claim every file exists, including our fictitious 'index.lock' for which
Expand Down Expand Up @@ -913,7 +1011,7 @@ class AnalyzerTests: AppTestCase {
// https://github.com/SwiftPackageIndex/SwiftPackageIndex-Server/issues/498
// setup
try savePackage(on: app.db, "1".asGithubUrl.url, processingStage: .ingestion)
let pkgs = try await Package.fetchCandidates(app.db, for: .analysis, limit: 10).get()
let pkgs = try await Package.fetchCandidates(app.db, for: .analysis, limit: 10)

let checkoutDir = Current.fileManager.checkoutsDirectory()
// claim every file exists, including our fictitious 'index.lock' for which
Expand Down Expand Up @@ -1230,6 +1328,7 @@ class AnalyzerTests: AppTestCase {
Current.fileManager.fileExists = { _ in true }
Current.git.commitCount = { _ in 2 }
Current.git.firstCommitDate = { _ in .t0 }
Current.git.hasBranch = { _, _ in true }
Current.git.lastCommitDate = { _ in .t1 }
struct Error: Swift.Error { }
Current.git.shortlog = { _ in
Expand Down Expand Up @@ -1335,6 +1434,7 @@ class AnalyzerTests: AppTestCase {
Current.fileManager.fileExists = { _ in true }
Current.git.commitCount = { _ in 2 }
Current.git.firstCommitDate = { _ in .t0 }
Current.git.hasBranch = { _, _ in true }
Current.git.lastCommitDate = { _ in .t1 }
struct Error: Swift.Error { }
Current.git.shortlog = { _ in
Expand Down Expand Up @@ -1454,6 +1554,7 @@ private struct Command: CustomStringConvertible {
case firstCommitDate
case lastCommitDate
case getTags
case hasBranch(String)
case reset
case resetToBranch(String)
case shortlog
Expand Down Expand Up @@ -1483,6 +1584,9 @@ private struct Command: CustomStringConvertible {
self.kind = .fetch
case .gitFirstCommitDate:
self.kind = .firstCommitDate
case _ where command.description.starts(with: "git show-ref --verify --quiet refs/heads/"):
let branch = String(command.description.split(separator: "/").last!)
self.kind = .hasBranch(branch)
case .gitLastCommitDate:
self.kind = .lastCommitDate
case .gitListTags:
Expand Down Expand Up @@ -1517,6 +1621,8 @@ private struct Command: CustomStringConvertible {
return "\(path): checkout \(ref)"
case .clone(let url):
return "\(path): clone \(url)"
case let .hasBranch(branch):
return "\(path): hasBranch \(branch)"
case .resetToBranch(let branch):
return "\(path): reset to \(branch)"
case .revisionInfo(let ref):
Expand Down
2 changes: 2 additions & 0 deletions Tests/AppTests/AnalyzerVersionThrottlingTests.swift
Original file line number Diff line number Diff line change
Expand Up @@ -166,6 +166,7 @@ class AnalyzerVersionThrottlingTests: AppTestCase {
var t: Date = .t0
Current.date = { t }
Current.git.getTags = { _ in [.branch("main")] }
Current.git.hasBranch = { _, _ in true }
let pkg = Package(url: "1".asGithubUrl.url)
try await pkg.save(on: app.db)
try await Repository(package: pkg, defaultBranch: "main").save(on: app.db)
Expand Down Expand Up @@ -217,6 +218,7 @@ class AnalyzerVersionThrottlingTests: AppTestCase {
// Leaving tags out of it for simplicity - they are tested specifically
// in test_throttle_ignore_tags above.
Current.git.getTags = { _ in [] }
Current.git.hasBranch = { _, _ in true }

// Little helper to simulate minimal version reconciliation
func runVersionReconciliation() async throws -> VersionDelta {
Expand Down
5 changes: 5 additions & 0 deletions Tests/AppTests/GitLiveTests.swift
Original file line number Diff line number Diff line change
Expand Up @@ -92,6 +92,11 @@ extension GitLiveTests {
)
}

/// Exercises `Git.hasBranch` against the checkout at `path`, expecting a
/// "master" branch to be found and a "main" branch not to be.
func test_hasBranch() async throws {
    let hasMaster = try await Git.hasBranch(.branch("master"), at: path)
    try await XCTAssertEqualAsync(hasMaster, true)

    let hasMain = try await Git.hasBranch(.branch("main"), at: path)
    try await XCTAssertEqualAsync(hasMain, false)
}

func test_revisionInfo() async throws {
try await XCTAssertEqualAsync(try await Git.revisionInfo(.tag(0,5,2), at: path),
.init(commit: "178566b112afe6bef3770678f1bbab6e5c626993",
Expand Down
Loading