Commit 09c510c

(dsl): Support specifying index argument in bulk requests (#646)
1 parent e32e07e commit 09c510c

File tree

12 files changed: +800 −191 lines changed

README.md

Lines changed: 27 additions & 4 deletions

@@ -129,12 +129,35 @@ ElasticQuery.range(User.age).gte(18).lt(100)

ZIO Elastic requests like `Create`, `CreateOrUpdate`, `CreateWithId`, and `DeleteById` are bulkable requests.
For bulkable requests, you can use the `bulk` API, which accepts request types that inherit the `Bulkable` trait.
When performing bulk operations, you can specify the target index at the request level for each individual operation.
However, you can also define a global index for the entire bulk request if all operations within that request target the same index. If a global index is specified for the bulk request, but an individual operation within that same bulk request also explicitly defines its own index, the individual operation's index takes precedence for that specific operation.

```scala
val indexName: IndexName         = IndexName("users-index")
val specificIndexName: IndexName = IndexName("specific-users-index")

// Each operation specifies its own index.
ElasticRequest.bulk(
  ElasticRequest.create[User](index = indexName, doc = User(1, "John Doe")),
  ElasticRequest.create[User](index = indexName, id = DocumentId("documentId2"), doc = User(2, "Jane Doe")),
  ElasticRequest.upsert[User](index = indexName, id = DocumentId("documentId3"), doc = User(3, "Richard Roe")),
  ElasticRequest.deleteById(index = indexName, id = DocumentId("documentId2"))
)

// A global index is provided for the whole bulk request.
ElasticRequest.bulk(
  index = indexName,
  ElasticRequest.create[User](doc = User(1, "John Doe")),
  ElasticRequest.upsert[User](id = DocumentId("documentId2"), doc = User(2, "Jane Doe")),
  ElasticRequest.deleteById(id = DocumentId("documentId3"))
)

// The upsert's own index overrides the global one for that operation.
ElasticRequest.bulk(
  index = indexName,
  ElasticRequest.create[User](doc = User(20, "Eve")),
  ElasticRequest.upsert[User](index = specificIndexName, id = DocumentId("docId4"), doc = User(21, "Charlie")),
  ElasticRequest.deleteById(id = DocumentId("docId5"))
)
```
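The precedence rule described above can be illustrated with a small, self-contained sketch (the `BulkOp` type and `effectiveIndex` helper are hypothetical names for illustration, not part of the library's API):

```scala
// Hypothetical sketch of the precedence rule, not the library's internals:
// a per-operation index, when present, wins over the bulk-level default.
final case class BulkOp(opIndex: Option[String], id: String)

def effectiveIndex(globalIndex: Option[String], op: BulkOp): Option[String] =
  op.opIndex.orElse(globalIndex)

// effectiveIndex(Some("users-index"), BulkOp(None, "1"))
//   -> Some("users-index") (falls back to the global index)
// effectiveIndex(Some("users-index"), BulkOp(Some("specific-users-index"), "2"))
//   -> Some("specific-users-index") (the operation's own index wins)
```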

Lines changed: 40 additions & 0 deletions

@@ -0,0 +1,40 @@

---
id: elastic_aggregation_sampler
title: "Sampler Aggregation"
---

The Sampler aggregation is a single-bucket aggregation that returns a sample of the documents that fall into the aggregation scope. It is particularly useful when you want to run sub-aggregations on a representative sample of documents rather than on the entire dataset.

To use the `Sampler` aggregation, import the following:
```scala
import zio.elasticsearch.aggregation.SamplerAggregation
import zio.elasticsearch.ElasticAggregation.samplerAggregation
```

A Sampler aggregation must always have at least one sub-aggregation.
You can create a Sampler aggregation with an initial sub-aggregation using the `samplerAggregation` method this way:
```scala
import zio.elasticsearch.ElasticAggregation.avgAggregation

val aggregation: SamplerAggregation = samplerAggregation(
  name = "samplerAggregation",
  subAgg = avgAggregation(name = "avgRating", field = Document.intField)
)
```

If you want to add another sub-aggregation, you can use the `withSubAgg` method:
```scala
import zio.elasticsearch.ElasticAggregation.maxAggregation

val aggregationWithMultipleSubAggs: SamplerAggregation = samplerAggregation(
  name = "samplerAggregation",
  subAgg = avgAggregation(name = "avgRating", field = Document.intField)
).withSubAgg(maxAggregation(name = "maxAggregation", field = Document.intField))
```

By default, the `shard_size` parameter for a Sampler aggregation is set to 100, meaning each shard returns at most 100 documents to be sampled.
If you want to change the `shard_size`, you can use the `maxDocumentsPerShard` method:
```scala
val aggregationWithShardSize: SamplerAggregation = samplerAggregation(
  name = "samplerAggregation",
  subAgg = avgAggregation(name = "avgRating", field = Document.intField)
).maxDocumentsPerShard(500)
```

You can find more detailed information about the `Sampler` aggregation in the official Elasticsearch documentation [here](https://www.elastic.co/docs/reference/aggregations/search-aggregations-bucket-sampler-aggregation).
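For orientation, a sampler aggregation with a sub-aggregation corresponds to Elasticsearch query JSON along these lines (a sketch based on the Elasticsearch aggregation docs; the exact payload this library emits may differ):

```json
{
  "aggs": {
    "samplerAggregation": {
      "sampler": { "shard_size": 500 },
      "aggs": {
        "avgRating": { "avg": { "field": "intField" } }
      }
    }
  }
}
```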

docs/overview/requests/elastic_request_bulk.md

Lines changed: 33 additions & 9 deletions

@@ -9,34 +9,58 @@

In order to use the `Bulk` request import the following:
```scala
import zio.elasticsearch.ElasticRequest.BulkRequest
import zio.elasticsearch.ElasticRequest.bulk
// this import is required for using `IndexName` and `DocumentId`
import zio.elasticsearch._
```

You can create a `Bulk` request using the `bulk` method, which offers two main ways to handle indices:

1. With a global index:

This approach is ideal when most (or all) of your bulk operations target the same index. You provide a default index for the entire bulk request as the first argument. Any individual operation within this `bulk` request that doesn't explicitly specify its own index will automatically use this global index.
_**Important: If an individual operation does specify its own index, that individual index always takes precedence over the global one for that specific operation.**_
```scala
val index = IndexName("my-global-index")

val document1 = new Document(id = DocumentId("111"), intField = 1, stringField = "stringField1")
val document2 = new Document(id = DocumentId("222"), intField = 2, stringField = "stringField2")

val request: BulkRequest = bulk(
  index = index,
  requests = create(doc = document1),
  upsert(id = DocumentId("111"), doc = document2)
)
```

2. Without a global index:

Choose this method when your bulk operations frequently target different indices, or when you prefer to explicitly define the index for every single operation. When using this variant, each individual `BulkableRequest` must specify its own index.
```scala
val index1 = IndexName("first-index")
val index2 = IndexName("second-index")

val document1 = new Document(id = DocumentId("111"), intField = 1, stringField = "stringField1")
val document2 = new Document(id = DocumentId("222"), intField = 2, stringField = "stringField2")

val request: BulkRequest = bulk(
  requests = create(index = index1, doc = document1),
  upsert(index = index2, id = DocumentId("111"), doc = document2)
)
```

If you want to change the `refresh`, you can use the `refresh`, `refreshFalse` or `refreshTrue` method:
```scala
val requestWithRefresh: BulkRequest = bulk(requests = create(index = index, doc = document1), upsert(index = index, id = DocumentId("111"), doc = document2)).refresh(true)
val requestWithRefreshFalse: BulkRequest = bulk(requests = create(index = index, doc = document1), upsert(index = index, id = DocumentId("111"), doc = document2)).refreshFalse
val requestWithRefreshTrue: BulkRequest = bulk(requests = create(index = index, doc = document1), upsert(index = index, id = DocumentId("111"), doc = document2)).refreshTrue
```

If you want to change the `routing`, you can use the `routing` method:
```scala
// this import is required for using `Routing` also
import zio.elasticsearch._

val requestWithRouting: BulkRequest = bulk(requests = create(index = index, doc = document1), upsert(index = index, id = DocumentId("111"), doc = document2)).routing(Routing("routing"))
```

You can find more information about the `Bulk` request [here](https://www.elastic.co/guide/en/elasticsearch/reference/7.17/docs-bulk.html).
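At the wire level this corresponds to the Elasticsearch `_bulk` API, where a default index can be supplied in the URL path (e.g. `POST /my-global-index/_bulk`) and any action line carrying its own `_index` field overrides that default. A rough NDJSON sketch under that assumption (based on the Elasticsearch bulk API docs, with an upsert-style operation shown as an `index` action; this is not necessarily the exact payload this library serializes):

```json
{ "create": { } }
{ "id": "111", "intField": 1, "stringField": "stringField1" }
{ "index": { "_index": "second-index", "_id": "222" } }
{ "id": "222", "intField": 2, "stringField": "stringField2" }
```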

modules/example/src/main/scala/example/RepositoriesElasticsearch.scala

Lines changed: 10 additions & 1 deletion

```diff
@@ -55,6 +55,13 @@ final case class RepositoriesElasticsearch(elasticsearch: Elasticsearch) {
     )
   } yield ()
 
+  def upsertBulk(organization: String, repositories: Chunk[GitHubRepo]): Task[Unit] =
+    for {
+      routing     <- routingOf(organization)
+      bulkRequests = repositories.map(repo => ElasticRequest.upsert(DocumentId(repo.id), repo).routing(routing))
+      _           <- elasticsearch.execute(ElasticRequest.bulk(Index, bulkRequests: _*))
+    } yield ()
+
   def upsert(id: String, repository: GitHubRepo): Task[Unit] =
     for {
       routing <- routingOf(repository.organization)
@@ -74,7 +81,6 @@ final case class RepositoriesElasticsearch(elasticsearch: Elasticsearch) {
 
   private def routingOf(value: String): IO[IllegalArgumentException, Routing.Type] =
     Routing.make(value).toZIO.mapError(e => new IllegalArgumentException(e))
-
 }
 
 object RepositoriesElasticsearch {
@@ -91,6 +97,9 @@ object RepositoriesElasticsearch {
   def createAll(repositories: Chunk[GitHubRepo]): RIO[RepositoriesElasticsearch, Unit] =
     ZIO.serviceWithZIO[RepositoriesElasticsearch](_.createAll(repositories))
 
+  def upsertBulk(organization: String, repositories: Chunk[GitHubRepo]): RIO[RepositoriesElasticsearch, Unit] =
+    ZIO.serviceWithZIO[RepositoriesElasticsearch](_.upsertBulk(organization, repositories))
+
   def upsert(id: String, repository: GitHubRepo): RIO[RepositoriesElasticsearch, Unit] =
     ZIO.serviceWithZIO[RepositoriesElasticsearch](_.upsert(id, repository))
```

modules/example/src/main/scala/example/api/Repositories.scala

Lines changed: 22 additions & 1 deletion

```diff
@@ -17,7 +17,6 @@
 package example.api
 
 import example.{GitHubRepo, RepositoriesElasticsearch}
-import zio.ZIO
 import zio.elasticsearch._
 import zio.elasticsearch.query.ElasticQuery
 import zio.elasticsearch.request.{CreationOutcome, DeletionOutcome}
@@ -29,7 +28,9 @@ import zio.http.Status.{
 }
 import zio.http.{Method, _}
 import zio.json.EncoderOps
+import zio.schema.Schema
 import zio.schema.codec.JsonCodec.{Configuration => JsonCodecConfig, JsonDecoder}
+import zio.{Chunk, ZIO}
 
 import CompoundOperator._
 import FilterOperator._
@@ -69,6 +70,26 @@ object Repositories {
         }
       }
     }.orDie,
+    Method.POST / BasePath / string("organization") / "bulk-upsert" -> handler {
+      (organization: String, req: Request) =>
+        req.body.asString
+          .map(JsonDecoder.decode[Chunk[GitHubRepo]](Schema.chunk(GitHubRepo.schema), _, JsonCodecConfig.default))
+          .flatMap {
+            case Left(jsonError) =>
+              ZIO.succeed(Response.json(ErrorResponse.fromReasons(jsonError.message).toJson).status(HttpBadRequest))
+            case Right(repositories) =>
+              RepositoriesElasticsearch
+                .upsertBulk(organization, repositories)
+                .map(_ => Response.status(HttpNoContent))
+                .catchAll(e =>
+                  ZIO.succeed(
+                    Response
+                      .json(ErrorResponse.fromReasons(s"Bulk operation failed: ${e.getMessage}").toJson)
+                      .status(HttpBadRequest)
+                  )
+                )
+          }
+    }.orDie,
     Method.POST / BasePath / "search" -> handler { (req: Request) =>
       req.body.asString
         .map(JsonDecoder.decode[Criteria](Criteria.schema, _, JsonCodecConfig.default))
```

modules/example/zio-elasticsearch-example.postman_collection.json

Lines changed: 36 additions & 0 deletions

@@ -57,6 +57,42 @@

The following request item is added to the collection:

```json
{
  "name": "Bulk Upsert Repositories",
  "request": {
    "method": "POST",
    "header": [
      {
        "key": "Content-Type",
        "value": "application/json"
      }
    ],
    "body": {
      "mode": "raw",
      "raw": "[\n {\n \"id\": \"repo-bulk-1\",\n \"organization\": \"lambdaworks\",\n \"name\": \"bulk-repo-one\",\n \"url\": \"https://github.com/lambdaworks/bulk-repo-one\",\n \"description\": \"First repository added via bulk upsert.\",\n \"lastCommitAt\": \"2023-01-01T10:00:00.000\",\n \"stars\": 100,\n \"forks\": 10\n },\n {\n \"id\": \"repo-bulk-2\",\n \"organization\": \"lambdaworks\",\n \"name\": \"bulk-repo-two\",\n \"url\": \"https://github.com/lambdaworks/bulk-repo-two\",\n \"description\": \"Second repository added via bulk upsert.\",\n \"lastCommitAt\": \"2023-01-02T11:00:00.000\",\n \"stars\": 200,\n \"forks\": 20\n },\n {\n \"id\": \"1234567\",\n \"organization\": \"lambdaworks\",\n \"name\": \"scurl-detector-updated\",\n \"url\": \"https://github.com/lambdaworks/scurl-detector\",\n \"description\": \"Scala library that detects and extracts URLs from text (UPDATED via bulk).\",\n \"lastCommitAt\": \"2023-01-03T12:00:00.000\",\n \"stars\": 150,\n \"forks\": 15\n }\n]",
      "options": {
        "raw": {
          "language": "json"
        }
      }
    },
    "url": {
      "raw": "http://localhost:{{HTTP_PORT}}/api/repositories/lambdaworks/bulk-upsert",
      "protocol": "http",
      "host": [
        "localhost"
      ],
      "port": "{{HTTP_PORT}}",
      "path": [
        "api",
        "repositories",
        "lambdaworks",
        "bulk-upsert"
      ]
    }
  },
  "response": []
}
```

0 commit comments
