Skip to content

[webcrawler] Support emitting non HTML documents (like PDFs...) (#739) #611

[webcrawler] Support emitting non HTML documents (like PDFs...) (#739)

[webcrawler] Support emitting non HTML documents (like PDFs...) (#739) #611

# Copyright DataStax, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Deploy workflow: on every push to `main`, build the LangStream Docker images
# and publish them to the public Amazon ECR registry under the `latest` tag.
name: Deploy
on:
  push:
    branches:
      - main
jobs:
  deploy:
    name: Deploy
    runs-on: LangStream-4-cores
    timeout-minutes: 20
    steps:
      # Credentials come from repository secrets; ECR Public authentication
      # is performed against the us-east-1 region.
      - name: Configure AWS credentials
        uses: aws-actions/configure-aws-credentials@v2
        with:
          aws-access-key-id: ${{ secrets.ECR_AWS_ACCESS_KEY_ID }}
          aws-secret-access-key: ${{ secrets.ECR_AWS_SECRET_ACCESS_KEY }}
          aws-region: us-east-1
      - name: Login to Amazon ECR Public
        id: login-ecr
        uses: aws-actions/amazon-ecr-login@v1
        with:
          registry-type: public
      # checkout/cache were bumped from v2: the v2 releases run on a retired
      # Node runtime and actions/cache v1-v2 no longer works on GitHub runners.
      - name: Checkout
        uses: actions/checkout@v4
      - name: Setup jdk
        uses: actions/setup-java@v3
        with:
          distribution: 'temurin'
          java-version: '17.x'
      # Reuse the local Maven repository between runs; the key changes
      # whenever any pom.xml changes, with a prefix fallback for partial hits.
      - name: Init maven repo
        uses: actions/cache@v4
        with:
          path: ~/.m2/repository
          key: ${{ runner.os }}-maven-${{ hashFiles('**/pom.xml') }}
          restore-keys: |
            ${{ runner.os }}-maven-
      - name: Build
        run: |
          chmod +x mvnw
          ./docker/build.sh
      # Retag each locally built `langstream/<image>:latest-dev` image as
      # `<repo>/<image>:latest` and push it to the public registry.
      - name: Push to ECR
        run: |
          readonly repo=public.ecr.aws/y3i6u2n7/datastax-public
          tag_and_push() {
            local image="$1"
            docker tag "langstream/${image}:latest-dev" "${repo}/${image}:latest"
            docker push "${repo}/${image}:latest"
          }
          tag_and_push langstream-runtime
          tag_and_push langstream-cli
          tag_and_push langstream-deployer
          tag_and_push langstream-control-plane
          tag_and_push langstream-api-gateway