Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

fix(media): filter first before getting git blob hash #1060

Merged
merged 4 commits into from
Dec 15, 2023
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions src/constants/constants.ts
Original file line number Diff line number Diff line change
Expand Up @@ -2,24 +2,24 @@

import { config } from "@config/config"

export enum JobStatus {

Check warning on line 5 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'JobStatus' is already declared in the upper scope on line 5 column 13

Check warning on line 5 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'JobStatus' is already declared in the upper scope on line 5 column 13
Ready = "READY", // Ready to run jobs
Running = "RUNNING", // A job is running
Failed = "FAILED", // A job has failed and recovery is needed
}

export enum SiteStatus {

Check warning on line 11 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'SiteStatus' is already declared in the upper scope on line 11 column 13

Check warning on line 11 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'SiteStatus' is already declared in the upper scope on line 11 column 13
Empty = "EMPTY", // A site record site is being initialized
Initialized = "INITIALIZED",
Launched = "LAUNCHED",
}

export enum RedirectionTypes {

Check warning on line 17 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'RedirectionTypes' is already declared in the upper scope on line 17 column 13

Check warning on line 17 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'RedirectionTypes' is already declared in the upper scope on line 17 column 13
CNAME = "CNAME",
A = "A",
}

export enum CollaboratorRoles {

Check warning on line 22 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'CollaboratorRoles' is already declared in the upper scope on line 22 column 13

Check warning on line 22 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'CollaboratorRoles' is already declared in the upper scope on line 22 column 13
Admin = "ADMIN",
Contributor = "CONTRIBUTOR",
IsomerAdmin = "ISOMERADMIN",
Expand All @@ -30,7 +30,7 @@
CollaboratorRoles.IsomerAdmin
>

export enum ReviewRequestStatus {

Check warning on line 33 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'ReviewRequestStatus' is already declared in the upper scope on line 33 column 13

Check warning on line 33 in src/constants/constants.ts

View workflow job for this annotation

GitHub Actions / lint

'ReviewRequestStatus' is already declared in the upper scope on line 33 column 13
Approved = "APPROVED",
Open = "OPEN",
Merged = "MERGED",
Expand Down Expand Up @@ -88,3 +88,5 @@
)
export const STAGING_BRANCH = "staging"
export const STAGING_LITE_BRANCH = "staging-lite"
export const PLACEHOLDER_FILE_NAME = ".keep"
export const GIT_SYSTEM_DIRECTORY = ".git"
84 changes: 62 additions & 22 deletions src/services/db/GitFileSystemService.ts
Original file line number Diff line number Diff line change
Expand Up @@ -32,12 +32,14 @@ import { MediaTypeError } from "@root/errors/MediaTypeError"
import { MediaFileOutput } from "@root/types"
import { GitHubCommitData } from "@root/types/commitData"
import type {
DirectoryContents,
GitCommitResult,
GitDirectoryItem,
GitFile,
} from "@root/types/gitfilesystem"
import type { IsomerCommitMessage } from "@root/types/github"
import { ALLOWED_FILE_EXTENSIONS } from "@root/utils/file-upload-utils"
import { getPaginatedDirectoryContents } from "@root/utils/files"

export default class GitFileSystemService {
private readonly git: SimpleGit
Expand Down Expand Up @@ -900,7 +902,7 @@ export default class GitFileSystemService {
mediaUrl: `${dataUrlPrefix},${file.content}`,
mediaPath: `${directoryName}/${fileName}`,
type: fileType,
addedTime: stats.birthtimeMs,
addedTime: stats.ctimeMs,
size: stats.size,
})
})
Expand All @@ -910,8 +912,11 @@ export default class GitFileSystemService {
listDirectoryContents(
repoName: string,
directoryPath: string,
branchName: string
): ResultAsync<GitDirectoryItem[], GitFileSystemError | NotFoundError> {
branchName: string,
page = 0,
limit = 0,
search = ""
): ResultAsync<DirectoryContents, GitFileSystemError | NotFoundError> {
const efsVolPath = this.getEfsVolPathFromBranch(branchName)
const isStaging = this.isStagingFromBranchName(branchName)
return this.getFilePathStats(
Expand Down Expand Up @@ -952,38 +957,73 @@ export default class GitFileSystemService {
const path = directoryPath === "" ? name : `${directoryPath}/${name}`
const type = isDirectory ? "dir" : "file"

return this.getGitBlobHash(repoName, path, isStaging)
.orElse(() => okAsync(""))
.andThen((sha) =>
ResultAsync.combine([
okAsync(sha),
this.getFilePathStats(
repoName,
path,
branchName !== STAGING_LITE_BRANCH
),
])
)
.andThen((shaAndStats) => {
const [sha, stats] = shaAndStats
return this.getFilePathStats(repoName, path, isStaging).andThen(
(stats) => {
const result: GitDirectoryItem = {
name,
type,
sha,
path,
size: type === "dir" ? 0 : stats.size,
addedTime: stats.birthtimeMs,
addedTime: stats.ctimeMs,
}

return okAsync(result)
})
}
)
})

return ResultAsync.combine(resultAsyncs)
})
.andThen((directoryItems) =>
.andThen((directoryContents) =>
okAsync(
getPaginatedDirectoryContents(directoryContents, page, limit, search)
)
)
.andThen((paginatedDirectoryContents) => {
const directories = paginatedDirectoryContents.directories.map(
(directory) =>
this.getGitBlobHash(repoName, directory.path, isStaging)
.orElse(() => okAsync(""))
.andThen((sha) => {
const result: GitDirectoryItem = {
...directory,
sha,
}

return okAsync(result)
})
)

const files = paginatedDirectoryContents.files.map((file) =>
this.getGitBlobHash(repoName, file.path, isStaging)
.orElse(() => okAsync(""))
.andThen((sha) => {
const result: GitDirectoryItem = {
...file,
sha,
}

return okAsync(result)
})
)

return ResultAsync.combine([
ResultAsync.combine(directories),
ResultAsync.combine(files),
okAsync(paginatedDirectoryContents.total),
])
})
.andThen(([directories, files, total]) =>
// Note: The sha is empty if the file is not tracked by Git
okAsync(directoryItems.filter((item) => item.sha !== ""))
// This may result in the number of files being less than the requested
// limit (if limit is greater than 0), but the trade-off is acceptable
// here because the user can use pagination to get the next set of files,
// which is guaranteed to be a fresh set of files
okAsync({
directories: directories.filter((directory) => directory.sha !== ""),
files: files.filter((file) => file.sha !== ""),
total,
})
)
}

Expand Down
1 change: 1 addition & 0 deletions src/services/db/GitHubService.ts
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@ import { STAGING_BRANCH } from "@root/constants"
import logger from "@root/logger/logger"
import { GitCommitResult } from "@root/types/gitfilesystem"
import { RawGitTreeEntry } from "@root/types/github"
import { getPaginatedDirectoryContents } from "@root/utils/files"
seaerchin marked this conversation as resolved.
Show resolved Hide resolved

import * as ReviewApi from "./review"

Expand Down
67 changes: 11 additions & 56 deletions src/services/db/RepoService.ts
Original file line number Diff line number Diff line change
Expand Up @@ -10,67 +10,23 @@ import UserWithSiteSessionData from "@root/classes/UserWithSiteSessionData"
import { FEATURE_FLAGS, STAGING_BRANCH } from "@root/constants"
import { GitHubCommitData } from "@root/types/commitData"
import type {
DirectoryContents,
GitCommitResult,
GitDirectoryItem,
GitFile,
} from "@root/types/gitfilesystem"
import { RawGitTreeEntry } from "@root/types/github"
import { MediaDirOutput, MediaFileOutput, MediaType } from "@root/types/media"
import { getPaginatedDirectoryContents } from "@root/utils/files"
import { getMediaFileInfo } from "@root/utils/media-utils"

import GitFileCommitService from "./GitFileCommitService"
import GitFileSystemService from "./GitFileSystemService"
import GitHubService from "./GitHubService"
import * as ReviewApi from "./review"

const PLACEHOLDER_FILE_NAME = ".keep"
const BRANCH_REF = config.get("github.branchRef")

const getPaginatedDirectoryContents = (
directoryContents: GitDirectoryItem[],
page: number,
limit = 15,
search = ""
): {
directories: GitDirectoryItem[]
files: GitDirectoryItem[]
total: number
} => {
const subdirectories = directoryContents.filter((item) => item.type === "dir")
const files = directoryContents.filter(
(item) => item.type === "file" && item.name !== PLACEHOLDER_FILE_NAME
)

let sortedFiles = _(files)
// Note: We are sorting by name here to maintain compatibility for
// GitHub-login users, since it is very expensive to get the addedTime for
// each file from the GitHub API. The files will be sorted by addedTime in
// milliseconds for GGS users, so they will never see the alphabetical
// sorting.
.orderBy(
[(file) => file.addedTime, (file) => file.name.toLowerCase()],
["desc", "asc"]
)

if (search) {
sortedFiles = sortedFiles.filter((file) =>
file.name.toLowerCase().includes(search.toLowerCase())
)
}
const totalLength = sortedFiles.value().length

const paginatedFiles = sortedFiles
.drop(page * limit)
.take(limit)
.value()

return {
directories: subdirectories,
files: paginatedFiles,
total: totalLength,
}
}

// TODO: update the typings here to remove `any`.
// We can type as `unknown` if required.

Expand Down Expand Up @@ -318,7 +274,7 @@ export default class RepoService extends GitHubService {
throw result.error
}

return result.value
return [...result.value.directories, ...result.value.files]
}

return super.readDirectory(sessionData, {
Expand All @@ -343,7 +299,7 @@ export default class RepoService extends GitHubService {
const { siteName } = sessionData
const defaultBranch = STAGING_BRANCH
logger.debug(`Reading media directory: ${directoryName}`)
let dirContent: GitDirectoryItem[] = []
let dirContent: DirectoryContents

if (
sessionData.growthbook?.getFeatureValue(
Expand All @@ -354,7 +310,10 @@ export default class RepoService extends GitHubService {
const result = await this.gitFileSystemService.listDirectoryContents(
siteName,
directoryName,
defaultBranch
defaultBranch,
page,
limit,
search
)

if (result.isErr()) {
Expand All @@ -363,17 +322,13 @@ export default class RepoService extends GitHubService {

dirContent = result.value
} else {
dirContent = await super.readDirectory(sessionData, {
const contents = await super.readDirectory(sessionData, {
directoryName,
})
dirContent = getPaginatedDirectoryContents(contents, page, limit, search)
}

const { directories, files, total } = getPaginatedDirectoryContents(
dirContent,
page,
limit,
search
)
const { directories, files, total } = dirContent

return {
directories: directories.map(({ name, type }) => ({
Expand Down
50 changes: 31 additions & 19 deletions src/services/db/__tests__/GitFileSystemService.spec.ts
Original file line number Diff line number Diff line change
Expand Up @@ -74,15 +74,15 @@ describe("GitFileSystemService", () => {
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("another-fake-dir-hash"),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("another-fake-file-hash"),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("fake-dir-hash"),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("fake-empty-dir-hash"),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("another-fake-file-hash"),
})

const expectedFakeDir: GitDirectoryItem = {
name: "fake-dir",
Expand Down Expand Up @@ -129,9 +129,10 @@ describe("GitFileSystemService", () => {
"",
DEFAULT_BRANCH
)
const actual = result
._unsafeUnwrap()
.sort((a, b) => a.name.localeCompare(b.name))
const actual = [
...result._unsafeUnwrap().directories,
...result._unsafeUnwrap().files,
].sort((a, b) => a.name.localeCompare(b.name))

expect(actual).toMatchObject([
expectedAnotherFakeDir,
Expand All @@ -146,20 +147,20 @@ describe("GitFileSystemService", () => {
revparse: jest.fn().mockRejectedValueOnce(new GitError()),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("another-fake-file-hash"),
revparse: jest.fn().mockRejectedValueOnce(new GitError()),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockResolvedValueOnce("fake-dir-hash"),
revparse: jest.fn().mockResolvedValueOnce("fake-empty-dir-hash"),
})
MockSimpleGit.cwd.mockReturnValueOnce({
revparse: jest.fn().mockRejectedValueOnce(new GitError()),
revparse: jest.fn().mockResolvedValueOnce("another-fake-file-hash"),
})

const expectedFakeDir: GitDirectoryItem = {
name: "fake-dir",
name: "fake-empty-dir",
type: "dir",
sha: "fake-dir-hash",
path: "fake-dir",
sha: "fake-empty-dir-hash",
path: "fake-empty-dir",
size: 0,
addedTime: fs.statSync(`${EFS_VOL_PATH_STAGING}/fake-repo/fake-dir`)
.ctimeMs,
Expand All @@ -181,9 +182,10 @@ describe("GitFileSystemService", () => {
DEFAULT_BRANCH
)

const actual = result
._unsafeUnwrap()
.sort((a, b) => a.name.localeCompare(b.name))
const actual = [
...result._unsafeUnwrap().directories,
...result._unsafeUnwrap().files,
].sort((a, b) => a.name.localeCompare(b.name))

expect(actual).toMatchObject([expectedAnotherFakeFile, expectedFakeDir])
})
Expand All @@ -202,23 +204,33 @@ describe("GitFileSystemService", () => {
revparse: jest.fn().mockRejectedValueOnce(new GitError()),
})

const actual = await GitFileSystemService.listDirectoryContents(
const result = await GitFileSystemService.listDirectoryContents(
"fake-repo",
"",
DEFAULT_BRANCH
)

expect(actual._unsafeUnwrap()).toHaveLength(0)
const actual = [
...result._unsafeUnwrap().directories,
...result._unsafeUnwrap().files,
]

expect(actual).toHaveLength(0)
})

it("should return an empty result if the directory is empty", async () => {
const actual = await GitFileSystemService.listDirectoryContents(
const result = await GitFileSystemService.listDirectoryContents(
"fake-repo",
"fake-empty-dir",
DEFAULT_BRANCH
)

expect(actual._unsafeUnwrap()).toHaveLength(0)
const actual = [
...result._unsafeUnwrap().directories,
...result._unsafeUnwrap().files,
]

expect(actual).toHaveLength(0)
})

it("should return a GitFileSystemError if the path is not a directory", async () => {
Expand Down
Loading
Loading