Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[BEAM-13633] [Playground] Implement method to get a default example for each SDKs #16484

Merged
merged 46 commits into from
Mar 1, 2022
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
Show all changes
46 commits
Select commit Hold shift + click to select a range
509b7ff
Implement method to get a default example for each SDKs
pavel-avilov Jan 12, 2022
e9cbe79
Add error handling
pavel-avilov Jan 12, 2022
68edd97
Added saving of precompiled objects catalog to cache at the server st…
Jan 12, 2022
ab16bea
Added caching of the catalog only in case of unspecified SDK
Jan 12, 2022
d181cce
Update regarding comments
Jan 13, 2022
5743386
Update regarding comments
Jan 13, 2022
38673a4
Simplified logging regarding comment
Jan 14, 2022
4071bdb
Get defaultExamplePath from the corresponding config
pavel-avilov Jan 14, 2022
3047469
Refactoring code
pavel-avilov Jan 14, 2022
d6e5d0b
Add the `link` field to response
pavel-avilov Jan 18, 2022
f80ebdd
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
pavel-avilov Jan 19, 2022
e035006
Remove gjson;
pavel-avilov Jan 19, 2022
c3c5c79
Refactoring code
pavel-avilov Jan 19, 2022
931b79e
Merge remote-tracking branch 'origin/BEAM-13632-cache-examples-data' …
pavel-avilov Jan 20, 2022
29e6f61
Getting default precompiled object from cache
pavel-avilov Jan 21, 2022
5688841
Refactoring code
pavel-avilov Jan 21, 2022
43fc19b
Added saving of precompiled objects catalog to cache at the server st…
Jan 12, 2022
27b0157
Added caching of the catalog only in case of unspecified SDK
Jan 12, 2022
b9b77b9
Update regarding comments
Jan 13, 2022
2187918
Update regarding comments
Jan 13, 2022
3655716
Simplified logging regarding comment
Jan 14, 2022
7fe3d8b
Updates regarding comments
Jan 24, 2022
6830670
Update for environment_service_test.go
Jan 24, 2022
af655a5
Merge remote-tracking branch 'origin/BEAM-13632-cache-examples-data' …
pavel-avilov Jan 24, 2022
b95103c
Get default example from catalog
pavel-avilov Jan 24, 2022
f4ae9a7
GetCatalogFromCacheOrStorage method
pavel-avilov Jan 25, 2022
276ddd1
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
pavel-avilov Jan 25, 2022
94a1613
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
pavel-avilov Jan 26, 2022
1550e3a
Update licenses
pavel-avilov Jan 26, 2022
8e6e1e5
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
pavel-avilov Feb 1, 2022
af3623c
Update licenses;
pavel-avilov Feb 1, 2022
a7d6ded
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
Feb 7, 2022
3c8bd03
[BEAM-13633][Playground]
Feb 7, 2022
f273192
[BEAM-13633][Playground]
Feb 7, 2022
ebf5888
[BEAM-13633][Playground]
Feb 8, 2022
29c28b5
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
Feb 8, 2022
e413153
[BEAM-13633][Playground]
Feb 8, 2022
da6baa0
Add code of the default example to response
pavel-avilov Feb 9, 2022
1ea1026
Revert "Add code of the default example to response"
pavel-avilov Feb 9, 2022
d8b7bdb
Refactoring code
pavel-avilov Feb 9, 2022
c189363
Refactoring code;
Feb 10, 2022
6e63cfb
Edit commentaries
pavel-avilov Feb 10, 2022
0bcb1c4
Refactoring code
pavel-avilov Feb 10, 2022
66a3ca5
Merge remote-tracking branch 'origin/master' into BEAM-13633_default_…
pavel-avilov Mar 1, 2022
52622a3
Merge branch 'master' into BEAM-13633_default_ex_for_sdks
pavel-avilov Mar 1, 2022
4f54530
Add bucket name to methods
pavel-avilov Mar 1, 2022
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 14 additions & 1 deletion playground/api/v1/api.proto
Original file line number Diff line number Diff line change
Expand Up @@ -184,7 +184,12 @@ message GetPrecompiledObjectLogsRequest{
string cloud_path = 1;
}

// GetListOfPrecompiledObjectsResponse represent the map between sdk and categories for the sdk.
// GetDefaultPrecompiledObjectRequest contains information of the needed PrecompiledObject sdk.
message GetDefaultPrecompiledObjectRequest {
Sdk sdk = 1;
}

// GetPrecompiledObjectsResponse represent the map between sdk and categories for the sdk.
message GetPrecompiledObjectsResponse{
repeated Categories sdk_categories = 1;
}
Expand All @@ -204,6 +209,11 @@ message GetPrecompiledObjectLogsResponse {
string output = 1;
}

// GetDefaultPrecompiledObjectResponse represents the default PrecompiledObject and his category for the sdk.
message GetDefaultPrecompiledObjectResponse {
PrecompiledObject precompiled_object = 1;
}

service PlaygroundService {

// Submit the job for an execution and get the pipeline uuid.
Expand Down Expand Up @@ -244,4 +254,7 @@ service PlaygroundService {

// Get the logs of an PrecompiledObject.
rpc GetPrecompiledObjectLogs(GetPrecompiledObjectLogsRequest) returns (GetPrecompiledObjectLogsResponse);

// Get the default precompile object for the sdk.
rpc GetDefaultPrecompiledObject(GetDefaultPrecompiledObjectRequest) returns (GetDefaultPrecompiledObjectResponse);
}
27 changes: 26 additions & 1 deletion playground/backend/cmd/server/controller.go
Original file line number Diff line number Diff line change
Expand Up @@ -262,7 +262,7 @@ func (controller *playgroundController) GetPrecompiledObjects(ctx context.Contex
// GetPrecompiledObjectCode returns the code of the specific example
func (controller *playgroundController) GetPrecompiledObjectCode(ctx context.Context, info *pb.GetPrecompiledObjectCodeRequest) (*pb.GetPrecompiledObjectCodeResponse, error) {
cd := cloud_bucket.New()
codeString, err := cd.GetPrecompiledObject(ctx, info.GetCloudPath())
codeString, err := cd.GetPrecompiledObjectCode(ctx, info.GetCloudPath())
if err != nil {
logger.Errorf("GetPrecompiledObjectCode(): cloud storage error: %s", err.Error())
return nil, errors.InternalError("Error during getting Precompiled Object's code", "Error with cloud connection")
Expand Down Expand Up @@ -294,3 +294,28 @@ func (controller *playgroundController) GetPrecompiledObjectLogs(ctx context.Con
response := pb.GetPrecompiledObjectLogsResponse{Output: logs}
return &response, nil
}

// GetDefaultPrecompiledObject returns the default precompile object for sdk.
func (controller *playgroundController) GetDefaultPrecompiledObject(ctx context.Context, info *pb.GetDefaultPrecompiledObjectRequest) (*pb.GetDefaultPrecompiledObjectResponse, error) {
switch info.Sdk {
case pb.Sdk_SDK_UNSPECIFIED, pb.Sdk_SDK_SCIO:
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I guess we can include SCIO as a supported SDK.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.

logger.Errorf("GetDefaultPrecompiledObject(): unimplemented sdk: %s\n", info.Sdk)
return nil, errors.InvalidArgumentError("Error during preparing", "Sdk is not implemented yet: %s", info.Sdk.String())
}

bucket := cloud_bucket.New()
precompiledObject, err := bucket.GetDefaultPrecompileObject(ctx, info.Sdk, controller.env.ApplicationEnvs.WorkingDir())
if err != nil {
logger.Errorf("GetDefaultPrecompileObject(): cloud storage error: %s", err.Error())
return nil, errors.InternalError("Error during getting default Precompiled Object", "Error with cloud connection")
}

response := pb.GetDefaultPrecompiledObjectResponse{PrecompiledObject: &pb.PrecompiledObject{
CloudPath: precompiledObject.CloudPath,
Name: precompiledObject.Name,
Description: precompiledObject.Description,
Type: precompiledObject.Type,
PipelineOptions: precompiledObject.PipelineOptions,
}}
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Shouldn't we return the code of the example as well? Or it will be requested from the frontend after receiving this response?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, this information will be enough for frontend.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Could you please also add the link field according to this one

return &response, nil
}
5 changes: 5 additions & 0 deletions playground/backend/configs/DEFAULT_EXAMPLES.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I am not sure that this file should be in configs folder. @KhaninArtur @ilya-kozyrev what do you think?

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think it's a good place for this file. What place do you propose?

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Now configs folder contains files that use to configure each SDK (commands for compile and run steps). But this file contains constants for each SDK, so maybe it would be better to create constant values into the code and do not create one more config file?

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Hm, on the other hand, we can configure default examples from one place instead of looking for them in the code. What do you think about adding the default_example field to the corresponding .json config? E.g. add "default_example": "SDK_GO/MinimalWordCount", to the SDK_GO.json file.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Sounds good.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@pavel-avilov could you please change the configs based on the discussion above?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.

"SDK_JAVA": "SDK_JAVA/MinimalWordCount",
"SDK_GO": "SDK_GO/MinimalWordCount",
"SDK_PYTHON": "SDK_PYTHON/WordCountWithMetrics"
}
571 changes: 358 additions & 213 deletions playground/backend/internal/api/v1/api.pb.go

Large diffs are not rendered by default.

38 changes: 38 additions & 0 deletions playground/backend/internal/api/v1/api_grpc.pb.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

68 changes: 56 additions & 12 deletions playground/backend/internal/cloud_bucket/precompiled_objects.go
Original file line number Diff line number Diff line change
Expand Up @@ -32,16 +32,18 @@ import (
)

const (
BucketName = "playground-precompiled-objects"
OutputExtension = "output"
LogsExtension = "log"
MetaInfoName = "meta.info"
Timeout = time.Second * 10
javaExtension = "java"
goExtension = "go"
pyExtension = "py"
scioExtension = "scala"
separatorsNumber = 2
BucketName = "playground-precompiled-objects"
OutputExtension = "output"
LogsExtension = "log"
MetaInfoName = "meta.info"
Timeout = time.Second * 10
javaExtension = "java"
goExtension = "go"
pyExtension = "py"
scioExtension = "scala"
separatorsNumber = 2
defaultExamplesConfigName = "DEFAULT_EXAMPLES.json"
configFolderName = "configs"
)

type ObjectInfo struct {
Expand Down Expand Up @@ -93,8 +95,8 @@ func New() *CloudStorage {
return &CloudStorage{}
}

// GetPrecompiledObject returns the source code of the example
func (cd *CloudStorage) GetPrecompiledObject(ctx context.Context, precompiledObjectPath string) (string, error) {
// GetPrecompiledObjectCode returns the source code of the example
func (cd *CloudStorage) GetPrecompiledObjectCode(ctx context.Context, precompiledObjectPath string) (string, error) {
extension, err := getFileExtensionBySdk(precompiledObjectPath)
if err != nil {
return "", err
Expand Down Expand Up @@ -173,6 +175,30 @@ func (cd *CloudStorage) GetPrecompiledObjects(ctx context.Context, targetSdk pb.
return &precompiledObjects, nil
}

// GetDefaultPrecompileObject returns the default precompiled object for the sdk
func (cd *CloudStorage) GetDefaultPrecompileObject(ctx context.Context, targetSdk pb.Sdk, workingDir string) (*ObjectInfo, error) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
func (cd *CloudStorage) GetDefaultPrecompileObject(ctx context.Context, targetSdk pb.Sdk, workingDir string) (*ObjectInfo, error) {
func (cd *CloudStorage) GetDefaultPrecompiledObject(ctx context.Context, targetSdk pb.Sdk, workingDir string) (*ObjectInfo, error) {

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.

defaultExampleToSdk, err := getDefaultExamplesFromJson(workingDir)
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Add error handling.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.

if err != nil {
return nil, err
}
infoPath := filepath.Join(defaultExampleToSdk[targetSdk.String()], MetaInfoName)
metaInfo, err := cd.getFileFromBucket(ctx, infoPath, "")
if err != nil {
return nil, err
}

precompiledObject := ObjectInfo{}
err = json.Unmarshal(metaInfo, &precompiledObject)
if err != nil {
logger.Errorf("json.Unmarshal: %v", err.Error())
return nil, err
}

precompiledObject.CloudPath = filepath.Dir(infoPath)

return &precompiledObject, nil
}

// getPrecompiledObjectsDirs finds directories with precompiled objects
// Since there is no notion of directory at cloud storage, then
// to avoid duplicates of a base path (directory) need to store it in a set/map.
Expand Down Expand Up @@ -267,6 +293,9 @@ func getFileExtensionBySdk(precompiledObjectPath string) (string, error) {

// getFullFilePath get full path to the precompiled object file
func getFullFilePath(objectDir string, extension string) string {
if extension == "" {
return objectDir
}
precompiledObjectName := filepath.Base(objectDir) //the base of the object's directory matches the name of the file
fileName := strings.Join([]string{precompiledObjectName, extension}, ".")
filePath := filepath.Join(objectDir, fileName)
Expand All @@ -288,3 +317,18 @@ func getSdkName(path string) string {
sdkName := strings.Split(path, string(os.PathSeparator))[0] // the path of the form "sdkName/example/", where the first part is sdkName
return sdkName
}

// getDefaultExamplesFromJson reads a json file that contains information about default examples for sdk and converts him to map
func getDefaultExamplesFromJson(workingDir string) (map[string]string, error) {
defaultExampleToSdk := map[string]string{}
configPath := filepath.Join(workingDir, configFolderName, defaultExamplesConfigName)
file, err := ioutil.ReadFile(configPath)
if err != nil {
return nil, err
}
err = json.Unmarshal(file, &defaultExampleToSdk)
if err != nil {
return nil, err
}
return defaultExampleToSdk, nil
}
Original file line number Diff line number Diff line change
Expand Up @@ -18,13 +18,18 @@ package cloud_bucket
import (
pb "beam.apache.org/playground/backend/internal/api/v1"
"context"
"fmt"
"io/fs"
"os"
"path/filepath"
"reflect"
"testing"
)

const (
precompiledObjectPath = "SDK_JAVA/MinimalWordCount"
targetSdk = pb.Sdk_SDK_UNSPECIFIED
defaultExamplesConfig = "{\n \"SDK_JAVA\": \"1\",\n \"SDK_GO\": \"2\",\n \"SDK_PYTHON\": \"3\"\n}"
)

var bucket *CloudStorage
Expand All @@ -35,6 +40,35 @@ func init() {
ctx = context.Background()
}

func TestMain(m *testing.M) {
err := setup()
if err != nil {
panic(fmt.Errorf("error during test setup: %s", err.Error()))
}
defer teardown()
m.Run()
}

func setup() error {
err := os.Mkdir(configFolderName, fs.ModePerm)
if err != nil {
return err
}
filePath := filepath.Join(configFolderName, defaultExamplesConfigName)
err = os.WriteFile(filePath, []byte(defaultExamplesConfig), 0600)
if err != nil {
return err
}
return nil
}

func teardown() {
err := os.RemoveAll(configFolderName)
if err != nil {
panic(fmt.Errorf("error during test setup: %s", err.Error()))
}
}

func Test_getFullFilePath(t *testing.T) {
type args struct {
examplePath string
Expand Down Expand Up @@ -250,6 +284,50 @@ func Benchmark_GetPrecompiledObjectOutput(b *testing.B) {

func Benchmark_GetPrecompiledObject(b *testing.B) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
func Benchmark_GetPrecompiledObject(b *testing.B) {
func Benchmark_GetPrecompiledObjectCode(b *testing.B) {

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done

for i := 0; i < b.N; i++ {
_, _ = bucket.GetPrecompiledObject(ctx, precompiledObjectPath)
_, _ = bucket.GetPrecompiledObjectCode(ctx, precompiledObjectPath)
}
}

func Benchmark_GetDefaultPrecompileObject(b *testing.B) {
for i := 0; i < b.N; i++ {
_, _ = bucket.GetDefaultPrecompileObject(ctx, targetSdk, "")
}
}

func Test_getDefaultExamplesFromJson(t *testing.T) {
expectedMap := map[string]string{"SDK_JAVA": "1", "SDK_GO": "2", "SDK_PYTHON": "3"}
type args struct {
workingDir string
}
tests := []struct {
name string
args args
want map[string]string
wantErr bool
}{
{
name: "get object from json",
args: args{workingDir: ""},
want: expectedMap,
wantErr: false,
},
{
name: "error if wrong json path",
args: args{workingDir: "Wrong_path"},
want: nil,
wantErr: true,
},
}
for _, tt := range tests {
t.Run(tt.name, func(t *testing.T) {
got, err := getDefaultExamplesFromJson(tt.args.workingDir)
if (err != nil) != tt.wantErr {
t.Errorf("getDefaultExamplesFromJson() error = %v, wantErr %v", err, tt.wantErr)
return
}
if !reflect.DeepEqual(got, tt.want) {
t.Errorf("getDefaultExamplesFromJson() got = %v, want %v", got, tt.want)
}
})
}
}
Loading