Scanning over a Store

The Scan family of APIs is very similar to List, but it allows you to list Items across your entire Store. This can be useful in scenarios such as:

Migrations and backfills that need to operate on every Item
Custom exporters to other datastores
Auditing/validation workflows
Deleting unwanted data
Building global aggregations (e.g. computing the top X blog posts by comments, or counting the number of Items meeting some criteria)

Be warned that these operations can be slow and expensive, especially on large Stores. You should use them sparingly and consider using List instead if you can. The results of a Scan operation are not guaranteed to be in any particular order. Items with multiple key paths will only be returned once, with their primary key path.

Beginning a Scan

Just like for a List operation, you begin by calling BeginScan with your desired parameters. You can then retrieve more Items by calling ContinueScan with the token returned by BeginScan.

For this example we’ll use the schema defined in Example: Movies Schema, which defines these key paths (among others):

Item Type	Key Path Template
Movie	`/movie-:id`
Actor	`/actor-:id`


17 collapsed lines
1
package main
2

3
import (
4
  "context"
5
  "fmt"
6
  "os"
7
  "slices"
8
  "strconv"
9
  "time"
10

11
  "github.com/google/uuid"
12

13
  "github.com/StatelyCloud/go-sdk/stately"
14
  // This is the code you generated from schema
15
  "github.com/StatelyCloud/stately/go-sdk-sample/schema"
16
)
17

18
func sampleScan(
19
  ctx context.Context,
20
  client stately.Client,
21
) (*stately.ListToken, error) {
22
  iter, err := client.BeginScan(
23
    ctx,
24
    stately.ScanOptions{ItemTypes: []string{"Movie", "Actor"}},
25
  )
26
  if err != nil {
27
    return nil, err
28
  }
29

30
  for iter.Next() {
31
    item := iter.Value()
32
    switch v := item.(type) {
33
    case *schema.Movie:
34
      fmt.Printf("Movie Title: %s\n", v.GetTitle())
35
    case *schema.Actor:
36
      fmt.Printf("Actor Name: %s\n", v.GetName())
37
    }
38
  }
39
  // When we've exhausted the iterator, we'll get a token that we
40
  // can use to fetch the next page of items.
41
  return iter.Token()
42
}


5 collapsed lines
1
require 'bundler/setup'
2
require_relative 'schema/stately'
3
require 'byebug'
4

5

6
# Starts a Scan limited to Movie and Actor Items, prints one line per
# Item returned, and hands back the token that came with the results.
def sample_scan(client)
  items, token = client.begin_scan(item_types: ['Movie', 'Actor'])

  items.each do |item|
    if item.is_a?(StatelyDB::Types::Movie)
      puts "[Movie] title: #{item.title}"
    elsif item.is_a?(StatelyDB::Types::Actor)
      puts "[Actor] name: #{item.name}"
    end
  end

  token
end


9 collapsed lines
1
from __future__ import annotations
2

3
from typing import TYPE_CHECKING
4

5
from statelydb import ListToken, SyncChangedItem, SyncDeletedItem, SyncReset, key_path
6

7
from .schema import Actor, Change, Character, Client, Movie
8

9

10
async def sample_scan(client: Client) -> ListToken:
    """Scan the Store for Movie and Actor Items and print each one.

    :param client: The generated Stately client used to run the scan.
    :return: The list token exposed by the scan result after it has been
        fully iterated.
    """
    scan_resp = await client.begin_scan(item_types=[Movie, Actor])

    async for item in scan_resp:
        if isinstance(item, Movie):
            print(f"[Movie] title: {item.title}")
        elif isinstance(item, Actor):
            print(f"[Actor] name: {item.name}")

    # When we've exhausted the iterator, we'll get a token that we can
    # use to fetch the next page of items.
    return scan_resp.token


3 collapsed lines
1
import { createClient, DatabaseClient, Movie } from "./schema/index.js";
2
import { keyPath, ListToken } from "@stately-cloud/client";
3

4
/**
 * Scans the Store for Movie and Actor Items, logs each one, and returns
 * the list token that becomes available after the iterator is drained.
 *
 * @param client - Generated database client used to run the scan.
 * @returns The list token for fetching the next page of items.
 * @throws Error if the iterator finished without exposing a token.
 */
async function sampleScan(client: DatabaseClient): Promise<ListToken> {
  const iter = client.beginScan({
    itemTypes: ["Movie", "Actor"],
  });
  for await (const item of iter) {
    if (client.isType(item, "Movie")) {
      console.log("Movie:", item.title);
    } else if (client.isType(item, "Actor")) {
      console.log("Actor:", item.name);
    }
  }
  // The token is only available once the iterator has been exhausted, so
  // check for it explicitly instead of silencing the compiler with `!`.
  const token = iter.token;
  if (token == null) {
    throw new Error("Scan finished without returning a list token");
  }
  return token;
}

1
# Scan the given Store for every Movie and Actor Item.
stately item scan --store-id <store-id-goes-here> --item-types Movie,Actor

Using the List Token to Continue

The result from BeginScan includes a list token, which you can pass to ContinueScan to continue the scan. Read more about list tokens in Using the List Token to Continue. Note that token.canSync will always be set to false for Scan operations.


17 collapsed lines
1
package main
2

3
import (
4
  "context"
5
  "fmt"
6
  "os"
7
  "slices"
8
  "strconv"
9
  "time"
10

11
  "github.com/google/uuid"
12

13
  "github.com/StatelyCloud/go-sdk/stately"
14
  // This is the code you generated from schema
15
  "github.com/StatelyCloud/stately/go-sdk-sample/schema"
16
)
17

18
func sampleContinueScan(
19
  ctx context.Context,
20
  client stately.Client,
21
  token *stately.ListToken,
22
) (*stately.ListToken, error) {
23
  iter, err := client.ContinueScan(ctx, token.Data)
24
  if err != nil {
25
    return nil, err
26
  }
27
  for iter.Next() {
28
    item := iter.Value()
29
    switch v := item.(type) {
30
    case *schema.Character:
31
      fmt.Printf("Character Name: %s\n", v.GetName())
32
    case *schema.Actor:
33
      fmt.Printf("Actor Name: %s\n", v.GetName())
34
    }
35
  }
36
  // You could save the token to call ContinueScan later.
37
  return iter.Token()
38
}


5 collapsed lines
1
require 'bundler/setup'
2
require_relative 'schema/stately'
3
require 'byebug'
4

5

6
# Continues a previously started Scan (despite the "list" in this method's
# name, it calls continue_scan), prints one line per Movie or Actor in the
# next page, and returns the new token.
def sample_continue_list(client, token)
  # Ask for the page that follows the supplied token
  page, next_token = client.continue_scan(token)

  page.each do |item|
    if item.is_a?(StatelyDB::Types::Movie)
      puts "[Movie] title: #{item.title}"
    elsif item.is_a?(StatelyDB::Types::Actor)
      puts "[Actor] name: #{item.name}"
    end
  end

  # The returned token can be stored and passed to continue_scan later.
  next_token
end


9 collapsed lines
1
from __future__ import annotations
2

3
from typing import TYPE_CHECKING
4

5
from statelydb import ListToken, SyncChangedItem, SyncDeletedItem, SyncReset, key_path
6

7
from .schema import Actor, Change, Character, Client, Movie
8

9

10
async def sample_continue_scan(client: Client, token: ListToken) -> ListToken:
    """Resume a Scan from a list token and print the next batch of Items.

    :param client: The generated Stately client used to run the scan.
    :param token: The list token returned by a previous scan call.
    :return: The new list token, which can be saved to continue later.
    """
    # Fetch the next page of items
    continue_scan_result = await client.continue_scan(token)

    # Print the title or name of each Movie or Actor in this batch
    async for item in continue_scan_result:
        if isinstance(item, Movie):
            print(f"[Movie] title: {item.title}")
        elif isinstance(item, Actor):
            print(f"[Actor] name: {item.name}")

    # You could save the token to call ContinueScan later.
    return continue_scan_result.token


3 collapsed lines
1
import { createClient, DatabaseClient, Movie } from "./schema/index.js";
2
import { keyPath, ListToken } from "@stately-cloud/client";
3

4
/**
 * Resumes a Scan from a list token, logs every Movie and Actor in the
 * returned page, and hands back the refreshed token.
 *
 * @param client - Generated database client used to continue the scan.
 * @param token - List token from an earlier scan call.
 * @returns The new list token, which can be saved to continue later.
 */
async function sampleContinueScan(
  client: DatabaseClient,
  token: ListToken,
): Promise<ListToken> {
  // `collect` pulls all the items from the iterator into an Array and
  // returns them together with the updated token.
  const page = await client.continueScan(token).collect();

  for (const entry of page.items) {
    if (client.isType(entry, "Movie")) {
      console.log("Movie:", entry.title);
      continue;
    }
    if (client.isType(entry, "Actor")) {
      console.log("Actor:", entry.name);
    }
  }

  // The token can be stored and passed to ContinueScan later.
  return page.token;
}

Filtering

You can pass a filter to BeginScan to only retrieve Items that match the filter. We currently support filtering by Item Type.

Limits

Pass a limit to BeginScan to cap the maximum number of Items to retrieve. If limit is set to 0, the first page of results is returned; that page may be empty if all of its results were filtered out. Be sure to check token.canContinue to see whether there are more results to fetch.

Segmentation

Because a Scan operation can be slow and expensive, you can segment the operation into smaller chunks by passing the totalSegments and segmentIndex parameters to BeginScan. This allows you to run multiple Scan operations in parallel, each responsible for a different segment of the Store. You can split your scan into up to 1,000,000 segments.

Listing Across Client Upgrades

Just like for List operations, you are not able to use a list token across client versions.