Updated

naeemaa00 · naeemaa00 · commit 9e68a854fb27 · 2024-02-09T07:33:42.000+05:30
diff --git a/AWS_Bedrock_Stability_AI_Imagegenerators/010.png b/AWS_Bedrock_Stability_AI_Imagegenerators/010.png
diff --git a/AWS_Bedrock_Stability_AI_Imagegenerators/errorsNoted.txt b/AWS_Bedrock_Stability_AI_Imagegenerators/errorsNoted.txt
@@ -0,0 +1,5 @@
+1. A client error occured: generation_error
+sagemaker_inference.errors.BaseInferenceToolkitError: (400, 'generation_error', 'image dimensions must be multiples of 64, got 300x253')
+
+2. A client error occured: generation_error
+sagemaker_inference.errors.BaseInferenceToolkitError: (400, 'generation_error', 'image too large, 1590226>1048576 pixels')
diff --git a/AWS_Bedrock_Stability_AI_Imagegenerators/imagetoimage.py b/AWS_Bedrock_Stability_AI_Imagegenerators/imagetoimage.py
@@ -0,0 +1,114 @@
+# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
+# SPDX-License-Identifier: Apache-2.0
+"""
+Shows how to generate an image from a reference image with SDXL 1.0 (on demand).
+"""
+import base64
+import io
+import json
+import logging
+import boto3
+from PIL import Image
+
+from botocore.exceptions import ClientError
+
+class ImageError(Exception):
+    "Custom exception for errors returned by SDXL"
+    def __init__(self, message):
+        self.message = message
+
+
+logger = logging.getLogger(__name__)
+logging.basicConfig(level=logging.INFO)
+
+
+def generate_image(model_id, body):
+    """
+    Generate an image using SDXL 1.0 on demand.
+    Args:
+        model_id (str): The model ID to use.
+        body (str) : The request body to use.
+    Returns:
+        image_bytes (bytes): The image generated by the model.
+    """
+
+    logger.info("Generating image with SDXL model %s", model_id)
+
+    bedrock = boto3.client(service_name='bedrock-runtime')
+   
+    accept = "application/json"
+    content_type = "application/json"
+
+    response = bedrock.invoke_model(
+        body=body, modelId=model_id, accept=accept, contentType=content_type
+    )
+    response_body = json.loads(response.get("body").read())
+    print(response_body['result'])
+
+    base64_image = response_body.get("artifacts")[0].get("base64")
+    base64_bytes = base64_image.encode('ascii')
+    image_bytes = base64.b64decode(base64_bytes)
+
+    finish_reason = response_body.get("artifacts")[0].get("finishReason")
+
+    if finish_reason == 'ERROR' or finish_reason == 'CONTENT_FILTERED':
+        raise ImageError(f"Image generation error. Error code is {finish_reason}")
+
+
+    logger.info("Successfully generated image with the SDXL 1.0 model %s", model_id)
+
+    return image_bytes
+
+
+
+def main():
+    """
+    Entrypoint for SDXL example.
+    """
+
+    logging.basicConfig(level = logging.INFO,
+                        format = "%(levelname)s: %(message)s")
+
+    model_id='stability.stable-diffusion-xl-v1'
+
+    prompt="""Corporate Meeting room with lights on."""
+
+    # Read reference image from file and encode as base64 strings.
+    with open("D:/VSCode/GitRepos/ExampleFlaskApp/static/images/bill.png", "rb") as image_file:
+        init_image = base64.b64encode(image_file.read()).decode('utf8')
+
+    # Create request body.
+    body=json.dumps({
+        "text_prompts": [
+        {
+        "text": prompt
+        }
+    ],
+    "init_image": init_image,
+    "style_preset" : "isometric"
+    })
+
+    try:
+        print(f"Generating image with SDXL model {model_id}... 1")
+        image_bytes=generate_image(model_id = model_id, body = body)
+        print(f"Generating image with SDXL model {model_id}... 2")
+        image = Image.open(io.BytesIO(image_bytes))
+        image.show()
+
+
+    except ClientError as err:
+        message=err.response["Error"]["Message"]
+        logger.error("A client error occurred: %s", message)
+        print("A client error occurred: " +
+              format(message))
+    except ImageError as err:
+        logger.error(err.message)
+        print(err.message)
+
+    else:
+        print(f"Finished generating image with SDXL model {model_id}.")
+
+
+if __name__ == "__main__":
+    main()
+
diff --git a/AWS_ETL_Job_In_Notebook/gluelab-lab3-etl-job.ipynb b/AWS_ETL_Job_In_Notebook/gluelab-lab3-etl-job.ipynb
@@ -0,0 +1,190 @@
+{
+	"cells": [
+		{
+			"cell_type": "markdown",
+			"metadata": {
+				"deletable": false,
+				"editable": false,
+				"trusted": true
+			},
+			"source": [
+				"\n",
+				"# Glue Studio Notebook\n",
+				"You are now running a **Glue Studio** notebook; before you can start using your notebook you *must* start an interactive session.\n",
+				"\n",
+				"## Available Magics\n",
+				"|          Magic              |   Type       |                                                                        Description                                                                        |\n",
+				"|-----------------------------|--------------|-----------------------------------------------------------------------------------------------------------------------------------------------------------|\n",
+				"| %%configure                 |  Dictionary  |  A json-formatted dictionary consisting of all configuration parameters for a session. Each parameter can be specified here or through individual magics. |\n",
+				"| %profile                    |  String      |  Specify a profile in your aws configuration to use as the credentials provider.                                                                          |\n",
+				"| %iam_role                   |  String      |  Specify an IAM role to execute your session with.                                                                                                        |\n",
+				"| %region                     |  String      |  Specify the AWS region in which to initialize a session                                                                                                  |\n",
+				"| %session_id                 |  String      |  Returns the session ID for the running session.                                                                                                          |\n",
+				"| %connections                |  List        |  Specify a comma separated list of connections to use in the session.                                                                                     |\n",
+				"| %additional_python_modules  |  List        |  Comma separated list of pip packages, s3 paths or private pip arguments.                                                                                 |\n",
+				"| %extra_py_files             |  List        |  Comma separated list of additional Python files from S3.                                                                                                 |\n",
+				"| %extra_jars                 |  List        |  Comma separated list of additional Jars to include in the cluster.                                                                                       |\n",
+				"| %number_of_workers          |  Integer     |  The number of workers of a defined worker_type that are allocated when a job runs. worker_type must be set too.                                          |\n",
+				"| %worker_type                |  String      |  Standard, G.1X, *or* G.2X. number_of_workers must be set too. Default is G.1X                                                                            |\n",
+				"| %glue_version               |  String      |  The version of Glue to be used by this session. Currently, the only valid options are 2.0 and 3.0 (eg: %glue_version 2.0)                                |\n",
+				"| %security_config            |  String      |  Define a security configuration to be used with this session.                                                                                            |\n",
+				"| %sql                        |  String      |  Run SQL code. All lines after the initial %%sql magic will be passed as part of the SQL code.                                                            |\n",
+				"| %streaming                  |  String      |  Changes the session type to Glue Streaming.                                                                                                              |\n",
+				"| %etl                        |  String      |   Changes the session type to Glue ETL.                                                                                                                   |\n",
+				"| %status                     |              |  Returns the status of the current Glue session including its duration, configuration and executing user / role.                                          |\n",
+				"| %stop_session               |              |  Stops the current session.                                                                                                                               |\n",
+				"| %list_sessions              |              |  Lists all currently running sessions by name and ID.                                                                                                     |\n",
+				"| %spark_conf                 |  String      |  Specify custom spark configurations for your session. E.g. %spark_conf spark.serializer=org.apache.spark.serializer.KryoSerializer                       |"
+			]
+		},
+		{
+			"cell_type": "code",
+			"execution_count": null,
+			"metadata": {
+				"trusted": true,
+				"vscode": {
+					"languageId": "python_glue_session"
+				}
+			},
+			"outputs": [],
+			"source": [
+				"# Adding required libraries and extra jars to the job -   # <------- PLEASE REPLACE ${BUCKET_NAME} BELOW!!!\n",
+				"\n",
+				"%extra_py_files s3://${BUCKET_NAME}/library/pycountry_convert.zip\n",
+				"%extra_jars s3://crawler-public/json/serde/json-serde.jar\n",
+				"\n",
+				"# Adding required properties to the job - # <------- PLEASE REPLACE ${BUCKET_NAME} BELOW!!!\n",
+				"\n",
+				"%%configure \n",
+				"{\n",
+				"  \"--enable-spark-ui\": \"true\",\n",
+				"  \"--spark-event-logs-path\": \"s3://${BUCKET_NAME}/output/lab3/sparklog/\",\n",
+				"  \"max_retries\": \"0\"         \n",
+				"}"
+			]
+		},
+		{
+			"cell_type": "code",
+			"execution_count": null,
+			"metadata": {
+				"editable": true,
+				"trusted": true,
+				"vscode": {
+					"languageId": "python_glue_session"
+				}
+			},
+			"outputs": [],
+			"source": [
+				"#Importing all the basic Glue, Spark libraries \n",
+				"\n",
+				"import sys\n",
+				"from awsglue.transforms import *\n",
+				"from awsglue.utils import getResolvedOptions\n",
+				"from pyspark.context import SparkContext\n",
+				"from awsglue.context import GlueContext\n",
+				"from awsglue.dynamicframe import DynamicFrame\n",
+				"from awsglue.job import Job\n",
+				"\n",
+				"# Important further required libraries\n",
+				"\n",
+				"from pyspark.sql.functions import udf, col\n",
+				"from pyspark.sql.types import IntegerType, StringType\n",
+				"from pyspark import SparkContext\n",
+				"from pyspark.sql import SQLContext\n",
+				"from datetime import datetime\n",
+				"\n",
+				"# Starting Spark/Glue Context\n",
+				"\n",
+				"sc = SparkContext.getOrCreate()\n",
+				"glueContext = GlueContext(sc)\n",
+				"spark = glueContext.spark_session\n",
+				"job = Job(glueContext)"
+			]
+		},
+		{
+			"cell_type": "code",
+			"execution_count": null,
+			"metadata": {
+				"trusted": true,
+				"vscode": {
+					"languageId": "python_glue_session"
+				}
+			},
+			"outputs": [],
+			"source": [
+				"# Important pycountry_convert function from the external python library (pycountry_convert.zip)\n",
+				"\n",
+				"from pycountry_convert import (\n",
+				"    convert_country_alpha2_to_country_name,\n",
+				"    convert_country_alpha2_to_continent,\n",
+				"    convert_country_name_to_country_alpha2,\n",
+				"    convert_country_alpha3_to_country_alpha2,\n",
+				")\n",
+				"\n",
+				"\n",
+				"# Defining the function code\n",
+				"def get_country_code2(country_name):\n",
+				"    country_code2 = 'US'\n",
+				"    try:\n",
+				"        country_code2 = convert_country_name_to_country_alpha2(country_name)\n",
+				"    except KeyError:\n",
+				"        country_code2 = ''\n",
+				"    return country_code2\n",
+				"\n",
+				"# leveraging the Country Code UDF\n",
+				"\n",
+				"udf_get_country_code2 = udf(lambda z: get_country_code2(z), StringType())\n",
+				"\n",
+				"\n",
+				"# Reading the dataset into a DataFrame\n",
+				"s3_bucket = \"s3://${BUCKET_NAME}/\"                              # <------- PLEASE REPLACE ONLY THE ${BUCKET_NAME} HERE (Keep the \"s3://\" and the final \"/\" part)!!!\n",
+				"job_time_string = datetime.now().strftime(\"%Y%m%d%H%M%S\")\n",
+				"\n",
+				"df = spark.read.load(s3_bucket + \"input/lab2/sample.csv\", \n",
+				"                     format=\"csv\", \n",
+				"                     sep=\",\", \n",
+				"                     inferSchema=\"true\", \n",
+				"                     header=\"true\")\n",
+				"\n",
+				"# Performing a transformation that adds a new Country Code column to the dataframe based on the Country Code UDF output\n",
+				"\n",
+				"new_df = df.withColumn('country_code_2', udf_get_country_code2(col(\"country\")))"
+			]
+		},
+		{
+			"cell_type": "code",
+			"execution_count": null,
+			"metadata": {
+				"trusted": true,
+				"vscode": {
+					"languageId": "python_glue_session"
+				}
+			},
+			"outputs": [],
+			"source": [
+				"# Sinking the data into another S3 bucket path\n",
+				"\n",
+				"new_df.write.csv(s3_bucket + \"output/lab3/notebook/\" + job_time_string + \"/\")"
+			]
+		}
+	],
+	"metadata": {
+		"kernelspec": {
+			"display_name": "Glue PySpark",
+			"language": "python",
+			"name": "glue_pyspark"
+		},
+		"language_info": {
+			"codemirror_mode": {
+				"name": "python",
+				"version": 3
+			},
+			"file_extension": ".py",
+			"mimetype": "text/x-python",
+			"name": "Python_Glue_Session",
+			"pygments_lexer": "python3"
+		}
+	},
+	"nbformat": 4,
+	"nbformat_minor": 4
+}
diff --git a/AWS_ETL_Job_In_Notebook/test.py b/AWS_ETL_Job_In_Notebook/test.py
@@ -0,0 +1,2 @@
+print("hello world")
+print("hello world 2")
diff --git a/AWS_MultiSource_Merge_Redshift/SQLCommands.sql b/AWS_MultiSource_Merge_Redshift/SQLCommands.sql
@@ -0,0 +1,20 @@
+create table workerslist (
+  ID varchar(100) not null,
+  Name  varchar(100) not null,
+  Description varchar(100) not null,
+  Email  varchar(100) not null,
+  Phone  varchar(100) not null,
+  Amount varchar(100) not null,
+  col0 varchar(100) not null,
+  col1  varchar(100) not null,
+  col2 varchar(100) not null,
+  col3  varchar(100) not null,
+  col4  varchar(100) not null,
+  col5 varchar(100) not null
+);
+
+
+SELECT *
+FROM DataSource2
+LEFT JOIN DataSource1 ON  DataSource1.col0 = DataSource2.id
+
diff --git a/AWS_MultiSource_Merge_Redshift/TestReport.csv b/AWS_MultiSource_Merge_Redshift/TestReport.csv
@@ -0,0 +1,18 @@
+ID,Name,Description,Email,Phone,Amount
+1,dsfgf,Activity unit,dgfsfg@gmail.com,9.46E+13,1.23E+15
+2,xyz1,Rolling mean employees,dfsd@gmail.com,9.15E+12,1.23E+15
+3,xyz2,Salaries and wages paid,drgdth@gmail.com,94534635633,1.23E+15
+4,dsvgs,"Sales, government funding, grants and subsidies",hthfgtth@gmail.com,94534635633,1.23E+15
+5,xyz4,Total income,3456tr@gmail.com,94534635633,1.23E+15
+6,xyz5,Total expenditure,dsgdfg@gmail.com,94534635633,1.23E+15
+7,dsdf,Operating profit before tax,yiutrhgr@gmail.com,94534635633,1.23E+15
+8,xyz8,Total assets,gfdg@gmail.com,94534635633,1.23E+15
+9,xyz9,Fixed tangible assets,34565ytr@gmail.com,94534635633,1.23E+15
+10,xyz10,Activity unit,sgfgdf@gmail.com,94534635633,1.23E+15
+11,zzzz2323241,testing,qetrfw@gmail.com,94534635633,1.23E+15
+12,ewrwerwee,testing 2,wrgdr@gmail.com,94534635633,1.23E+15
+13,rtt,fgdfg,e5ye@gmail.com,94534635633,1.23E+15
+14,dg,ett,trea@gmail.com,94534635633,1.23E+15
+15,grgf,dgdg,dgdf@gmail.com,94534635633,1.23E+15
+16,rgr,fdsgfsd,dvd@gmail.com,94534635633,1.23E+15
+17,fgg,dgdg,cvcv@gmail.com,94534635633,1.23E+15
diff --git a/AWS_MultiSource_Merge_Redshift/TestReport2.csv b/AWS_MultiSource_Merge_Redshift/TestReport2.csv
@@ -0,0 +1,18 @@
+col0,col1,col2,col3,col4,col5
+1,dsfgf,Activity unit,dgfsfg@gmail.com,9.46E+13,1.23E+15
+2,xyz1,Rolling mean employees,dfsd@gmail.com,9.15E+12,1.23E+15
+3,xyz2,Salaries and wages paid,drgdth@gmail.com,94534635633,1.23E+15
+4,dsvgs,"Sales, government funding, grants and subsidies",hthfgtth@gmail.com,94534635633,1.23E+15
+5,xyz4,Total income,3456tr@gmail.com,94534635633,1.23E+15
+6,xyz5,Total expenditure,dsgdfg@gmail.com,94534635633,1.23E+15
+7,dsdf,Operating profit before tax,yiutrhgr@gmail.com,94534635633,1.23E+15
+8,xyz8,Total assets,gfdg@gmail.com,94534635633,1.23E+15
+9,xyz9,Fixed tangible assets,34565ytr@gmail.com,94534635633,1.23E+15
+10,xyz10,Activity unit,sgfgdf@gmail.com,94534635633,1.23E+15
+11,zzzz2323241,testing,qetrfw@gmail.com,94534635633,1.23E+15
+12,ewrwerwee,testing 2,wrgdr@gmail.com,94534635633,1.23E+15
+13,rtt,fgdfg,e5ye@gmail.com,94534635633,1.23E+15
+14,dg,ett,trea@gmail.com,94534635633,1.23E+15
+15,grgf,dgdg,dgdf@gmail.com,94534635633,1.23E+15
+16,rgr,fdsgfsd,dvd@gmail.com,94534635633,1.23E+15
+17,fgg,dgdg,cvcv@gmail.com,94534635633,1.23E+15
diff --git a/AWS_RDS_Arora_Serverless/SQLCommands.sql b/AWS_RDS_Arora_Serverless/SQLCommands.sql
diff --git a/AWS_Streaming_Glue_Job/glueworkshop-lab4-streaming-job.py b/AWS_Streaming_Glue_Job/glueworkshop-lab4-streaming-job.py

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+print("hello world")`
	`2`	`+print("hello world 2")`
-Original file line number
+Diff line change
@@ @@ -0,0 +1,18 @@ @@
 +ID,Name,Description,Email,Phone,Amount
 +1,dsfgf,Activity unit,dgfsfg@gmail.com,9.46E+13,1.23E+15
 +2,xyz1,Rolling mean employees,dfsd@gmail.com,9.15E+12,1.23E+15
 +3,xyz2,Salaries and wages paid,drgdth@gmail.com,94534635633,1.23E+15
 +4,dsvgs,"Sales, government funding, grants and subsidies",hthfgtth@gmail.com,94534635633,1.23E+15
 +5,xyz4,Total income,3456tr@gmail.com,94534635633,1.23E+15
 +6,xyz5,Total expenditure,dsgdfg@gmail.com,94534635633,1.23E+15
 +7,dsdf,Operating profit before tax,yiutrhgr@gmail.com,94534635633,1.23E+15
 +8,xyz8,Total assets,gfdg@gmail.com,94534635633,1.23E+15
 +9,xyz9,Fixed tangible assets,34565ytr@gmail.com,94534635633,1.23E+15
 +10,xyz10,Activity unit,sgfgdf@gmail.com,94534635633,1.23E+15
 +11,zzzz2323241,testing,qetrfw@gmail.com,94534635633,1.23E+15
 +12,ewrwerwee,testing 2,wrgdr@gmail.com,94534635633,1.23E+15
 +13,rtt,fgdfg,e5ye@gmail.com,94534635633,1.23E+15
 +14,dg,ett,trea@gmail.com,94534635633,1.23E+15
 +15,grgf,dgdg,dgdf@gmail.com,94534635633,1.23E+15
 +16,rgr,fdsgfsd,dvd@gmail.com,94534635633,1.23E+15
 +17,fgg,dgdg,cvcv@gmail.com,94534635633,1.23E+15