anthropics / beam
File Size

The distribution of file sizes (measured in lines of code).

Intro
Learn more...
File Size Overall
20% | 14% | 27% | 17% | 20%
Legend:
1001+
501-1000
201-500
101-200
1-100


explore: grouped by folders | grouped by size | sunburst | 3D view
File Size per Extension
1001+
501-1000
201-500
101-200
1-100
java: 13% | 15% | 29% | 20% | 21%
go: 35% | 14% | 20% | 14% | 14%
py: 25% | 20% | 30% | 12% | 10%
ts: 46% | 6% | 23% | 14% | 8%
yaml: 44% | 10% | 10% | 5% | 29%
proto: 46% | 24% | 16% | 5% | 7%
dart: 11% | 2% | 18% | 16% | 50%
groovy: 58% | 0% | 13% | 15% | 13%
kts: 0% | 31% | 44% | 16% | 7%
ftl: 0% | 100% | 0% | 0% | 0%
scss: 0% | 0% | 42% | 36% | 21%
html: 0% | 0% | 30% | 14% | 55%
tsx: 0% | 0% | 55% | 16% | 27%
js: 0% | 0% | 30% | 39% | 30%
pyi: 0% | 0% | 100% | 0% | 0%
xml: 0% | 0% | 51% | 0% | 48%
ipynb: 0% | 0% | 59% | 40% | 0%
sql: 0% | 0% | 4% | 15% | 79%
pyx: 0% | 0% | 0% | 61% | 38%
pxd: 0% | 0% | 0% | 42% | 57%
css: 0% | 0% | 0% | 68% | 31%
sass: 0% | 0% | 0% | 35% | 64%
kt: 0% | 0% | 0% | 0% | 100%
tpl: 0% | 0% | 0% | 0% | 100%
hcl: 0% | 0% | 0% | 0% | 100%
toml: 0% | 0% | 0% | 0% | 100%
ps1: 0% | 0% | 0% | 0% | 100%
h: 0% | 0% | 0% | 0% | 100%
cfg: 0% | 0% | 0% | 0% | 100%
rdf: 0% | 0% | 0% | 0% | 100%
in: 0% | 0% | 0% | 0% | 100%
scala: 0% | 0% | 0% | 0% | 100%
File Size per Logical Decomposition
primary
1001+
501-1000
201-500
101-200
1-100
sdks: 23% | 17% | 27% | 16% | 16%
runners: 9% | 13% | 32% | 22% | 22%
playground: 32% | 6% | 16% | 14% | 30%
learning: 11% | 5% | 6% | 14% | 61%
model: 55% | 13% | 16% | 6% | 8%
buildSrc: 71% | 0% | 16% | 4% | 7%
website: 8% | 3% | 32% | 25% | 30%
infra: 21% | 28% | 38% | 9% | 2%
ROOT: 0% | 61% | 27% | 9% | 1%
it: 0% | 0% | 41% | 28% | 29%
.test-infra: 0% | 0% | 45% | 16% | 38%
scripts: 0% | 0% | 39% | 43% | 16%
release: 0% | 0% | 21% | 49% | 28%
contributor-docs: 0% | 0% | 0% | 100% | 0%
.github: 0% | 0% | 0% | 0% | 100%
plugins: 0% | 0% | 0% | 0% | 100%
.gemini: 0% | 0% | 0% | 0% | 100%
Longest Files (Top 50)
File | # lines | # units
register.go
in sdks/go/pkg/beam/register
7254 504
go.g.yaml
in playground/frontend/playground_components/assets/symbols
6641 -
beam_fn_api.pb.go
in sdks/go/pkg/beam/model/fnexecution_v1
5486 545
beam_runner_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/pipeline/v1
5095 102
frames.py
in sdks/python/apache_beam/dataframe
4173 191
beam_fn_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/fn_execution/v1
3456 67
api.pb.go
in learning/tour-of-beam/backend/playground_api/api/v1
3333 339
api.pb.go
in playground/backend/internal/api/v1
3333 339
BigQueryIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigquery
2664 168
FnApiDoFnRunner.java
in sdks/java/harness/src/main/java/org/apache/beam/fn/harness
2428 156
core.py
in sdks/python/apache_beam/transforms
2413 286
api.pb.dart
in playground/frontend/playground_components/lib/src/api/v1
2383 113
BeamModulePlugin.groovy
in buildSrc/src/main/groovy/org/apache/beam/gradle
2377 7
dataflow_v1b3_messages.py
in sdks/python/apache_beam/runners/dataflow/internal/clients/dataflow
2358 -
DataflowRunner.java
in runners/google-cloud-dataflow-java/src/main/java/org/apache/beam/runners/dataflow
2215 86
KafkaIO.java
in sdks/java/io/kafka/src/main/java/org/apache/beam/sdk/io/kafka
2191 169
DoFnSignatures.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/transforms/reflect
2091 67
beam_job_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
2041 194
descriptor.ts
in sdks/typescript/src/apache_beam/proto/google/protobuf
1991 27
bigquery.py
in sdks/python/apache_beam/io/gcp
1953 95
JdbcIO.java
in sdks/java/io/jdbc/src/main/java/org/apache/beam/sdk/io/jdbc
1931 153
decoders.go
in sdks/go/pkg/beam/core/runtime/exec/optimized
1856 441
ElasticsearchIO.java
in sdks/java/io/elasticsearch/src/main/java/org/apache/beam/sdk/io/elasticsearch
1831 174
bundle_processor.py
in sdks/python/apache_beam/runners/worker
1786 128
encoders.go
in sdks/go/pkg/beam/core/runtime/exec/optimized
1772 421
elementmanager.go
in sdks/go/pkg/beam/runners/prism/internal/engine
1756 85
schema.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1749 181
metrics.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1734 111
proto
beam_runner_api.proto
in model/pipeline/src/main/proto/org/apache/beam/model/pipeline/v1
1722 -
pipeline_options.py
in sdks/python/apache_beam/options
1719 71
SpannerIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/spanner
1709 170
capability_matrix.yaml
in website/www/site/data
1685 -
translations.py
in sdks/python/apache_beam/runners/portability/fn_api_runner
1679 64
BigQueryServicesImpl.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigquery
1656 67
DatastoreV1.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/datastore
1645 136
v1.pb.go
in sdks/go/pkg/beam/core/runtime/graphx/v1
1608 148
TableRowToStorageApiProto.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigquery
1607 38
FlinkStateInternals.java
in runners/flink/src/main/java/org/apache/beam/runners/flink/translation/wrappers/streaming/state
1587 121
bigquery_v2_messages.py
in sdks/python/apache_beam/io/gcp/internal/clients/bigquery
1582 -
PCollectionViews.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/values
1534 105
PipelineOptionsFactory.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/options
1521 67
calls.go
in sdks/go/pkg/beam/core/util/reflectx
1490 270
beam_artifact_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
1484 144
BigtableIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigtable
1473 132
util.py
in sdks/python/apache_beam/transforms
1457 117
coder_impl.py
in sdks/python/apache_beam/coders
1409 191
AvroUtils.java
in sdks/java/extensions/avro/src/main/java/org/apache/beam/sdk/extensions/avro/schemas/utils
1365 75
Combine.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/transforms
1359 160
common.py
in sdks/python/apache_beam/runners
1311 97
bigquery_tools.py
in sdks/python/apache_beam/io/gcp
1267 78
Files With Most Units (Top 50)
File | # lines | # units
beam_fn_api.pb.go
in sdks/go/pkg/beam/model/fnexecution_v1
5486 545
register.go
in sdks/go/pkg/beam/register
7254 504
decoders.go
in sdks/go/pkg/beam/core/runtime/exec/optimized
1856 441
encoders.go
in sdks/go/pkg/beam/core/runtime/exec/optimized
1772 421
api.pb.go
in learning/tour-of-beam/backend/playground_api/api/v1
3333 339
api.pb.go
in playground/backend/internal/api/v1
3333 339
coders.py
in sdks/python/apache_beam/coders
1101 323
core.py
in sdks/python/apache_beam/transforms
2413 286
calls.go
in sdks/go/pkg/beam/core/util/reflectx
1490 270
trigger.py
in sdks/python/apache_beam/transforms
1162 239
beam_job_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
2041 194
coder_impl.py
in sdks/python/apache_beam/coders
1409 191
frames.py
in sdks/python/apache_beam/dataframe
4173 191
schema.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1749 181
ElasticsearchIO.java
in sdks/java/io/elasticsearch/src/main/java/org/apache/beam/sdk/io/elasticsearch
1831 174
SpannerIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/spanner
1709 170
KafkaIO.java
in sdks/java/io/kafka/src/main/java/org/apache/beam/sdk/io/kafka
2191 169
BigQueryIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigquery
2664 168
Combine.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/transforms
1359 160
FnApiDoFnRunner.java
in sdks/java/harness/src/main/java/org/apache/beam/fn/harness
2428 156
JdbcIO.java
in sdks/java/io/jdbc/src/main/java/org/apache/beam/sdk/io/jdbc
1931 153
v1.pb.go
in sdks/go/pkg/beam/core/runtime/graphx/v1
1608 148
beam_artifact_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
1484 144
cells.py
in sdks/python/apache_beam/metrics
648 143
Schema.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/schemas
1089 143
base.py
in sdks/python/apache_beam/ml/inference
1170 142
AvroIO.java
in sdks/java/extensions/avro/src/main/java/org/apache/beam/sdk/extensions/avro/io
1177 138
SimpleDoFnRunner.java
in runners/core-java/src/main/java/org/apache/beam/runners/core
1254 137
DatastoreV1.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/datastore
1645 136
yaml_provider.py
in sdks/python/apache_beam/yaml
1141 134
BigtableIO.java
in sdks/java/io/google-cloud-platform/src/main/java/org/apache/beam/sdk/io/gcp/bigtable
1473 132
typehints.py
in sdks/python/apache_beam/typehints
920 130
combiners.py
in sdks/python/apache_beam/transforms
731 129
PAssert.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/testing
1179 129
bundle_processor.py
in sdks/python/apache_beam/runners/worker
1786 128
schemas.py
in sdks/python/apache_beam/typehints
846 127
FlinkStateInternals.java
in runners/flink/src/main/java/org/apache/beam/runners/flink/translation/wrappers/streaming/state
1587 121
util.py
in sdks/python/apache_beam/transforms
1457 117
iobase.py
in sdks/python/apache_beam/io
750 113
api.pb.dart
in playground/frontend/playground_components/lib/src/api/v1
2383 113
metrics.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1734 111
callers.go
in sdks/go/pkg/beam/core/runtime/exec/optimized
470 111
WindowedValues.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/values
916 110
SnowflakeIO.java
in sdks/java/io/snowflake/src/main/java/org/apache/beam/sdk/io/snowflake
1169 109
WatermarkManager.java
in runners/direct-java/src/main/java/org/apache/beam/runners/direct
1165 106
TextIO.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/io
806 105
PCollectionViews.java
in sdks/java/core/src/main/java/org/apache/beam/sdk/values
1534 105
beam_runner_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/pipeline/v1
5095 102
worker_handlers.py
in sdks/python/apache_beam/runners/portability/fn_api_runner
934 99
operations.py
in sdks/python/apache_beam/runners/worker
1028 99
Files With Long Lines (Top 50)

There are 523 files with lines longer than 120 characters. In total, there are 5228 long lines.

File | # lines | # units | # long lines
register.go
in sdks/go/pkg/beam/register
7254 504 874
beam_runner_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/pipeline/v1
5095 102 384
beam_fn_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/fn_execution/v1
3456 67 299
api.pb.dart
in playground/frontend/playground_components/lib/src/api/v1
2383 113 253
beam_fn_api.pb.go
in sdks/go/pkg/beam/model/fnexecution_v1
5486 545 152
descriptor.ts
in sdks/typescript/src/apache_beam/proto/google/protobuf
1991 27 137
beam-codestyle.xml
in sdks/java/build-tools/src/main/resources/beam
313 - 101
beam_artifact_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/job_management/v1
994 19 81
beam_job_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/job_management/v1
1193 24 80
schema.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/pipeline/v1
1175 18 75
api_grpc.pb.go
in learning/tour-of-beam/backend/playground_api/api/v1
736 62 73
api_grpc.pb.go
in playground/backend/internal/api/v1
736 62 73
BeamModulePlugin.groovy
in buildSrc/src/main/groovy/org/apache/beam/gradle
2377 7 70
controller.go
in playground/backend/cmd/server
517 21 61
mock.go
in learning/tour-of-beam/backend/playground_api/api/v1
811 40 56
beam_job_api.grpc-client.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/job_management/v1
107 1 56
api.pbjson.dart
in playground/frontend/playground_components/lib/src/api/v1
468 - 51
beam_job_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
2041 194 49
calls.go
in sdks/go/pkg/beam/core/util/reflectx
1490 270 45
elementmanager.go
in sdks/go/pkg/beam/runners/prism/internal/engine
1756 85 42
beam_artifact_api.grpc-client.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/job_management/v1
107 4 38
beam_fn_api.grpc-client.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/fn_execution/v1
132 6 36
capability_matrix.yaml
in website/www/site/data
1685 - 36
api.pb.go
in learning/tour-of-beam/backend/playground_api/api/v1
3333 339 34
api.pb.go
in playground/backend/internal/api/v1
3333 339 34
beam_artifact_api.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
1484 144 33
beam_artifact_api_grpc.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
457 45 31
beam_job_api_grpc.pb.go
in sdks/go/pkg/beam/model/jobmanagement_v1
453 40 31
capability_matrix_snapshot.yaml
in website/www/site/data
733 - 30
standard_coders.yaml
in model/fn-execution/src/main/resources/org/apache/beam/model/fnexecution/v1
395 - 29
schema.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1749 181 27
fn.go
in sdks/go/pkg/beam/core/graph
1247 65 27
api.pbenum.dart
in playground/frontend/playground_components/lib/src/api/v1
93 - 25
stage.go
in sdks/go/pkg/beam/runners/prism/internal
631 9 24
worker.go
in sdks/go/pkg/beam/runners/prism/internal/worker
699 34 24
sdks.html
in website/www/site/layouts/partials/section-menu/en
161 - 24
code_processing.go
in playground/backend/internal/code_processing
497 27 24
beam_provision_api.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/fn_execution/v1
212 4 23
metrics.pb.go
in sdks/go/pkg/beam/model/pipeline_v1
1734 111 22
statemgr.go
in sdks/go/pkg/beam/core/runtime/harness
588 37 22
account_keys.py
in infra/enforcement
302 16 21
beam_fn_api_grpc.pb.go
in sdks/go/pkg/beam/model/fnexecution_v1
570 62 21
flink_python_pipeline_options.html
in website/www/site/layouts/shortcodes
202 - 21
flink_java_pipeline_options.html
in website/www/site/layouts/shortcodes
202 - 21
header.html
in website/www/site/layouts/partials
238 - 21
generate_event.py
in learning/katas/python/Streaming/Triggers/Early Triggers
37 2 20
generate_event.py
in learning/katas/python/Streaming/Triggers/Window Accumulation Modes
37 2 20
generate_event.py
in learning/katas/python/Streaming/Triggers/Event Time Triggers
37 2 20
metrics.ts
in sdks/typescript/src/apache_beam/proto/org/apache/beam/model/pipeline/v1
379 7 20
dataflow.go
in sdks/go/pkg/beam/runners/dataflow
377 10 19