Skip to content

Commit

Permalink
Merge branch 'main' of github.com:mikegre-google/maxtext
Browse files: browse the repository at this point in the history
  • Loading branch information
mikegre-google committed Apr 12, 2024
2 parents c822cea + 6094542 commit 9ee125e
Show file tree
Hide file tree
Showing 42 changed files with 29 additions and 1,025 deletions.
8 changes: 4 additions & 4 deletions .github/workflows/UnitTests.yml
Original file line number Diff line number Diff line change
Expand Up @@ -106,19 +106,19 @@ jobs:
- name: Test generate_param_only_checkpoint
run: |
docker run -v /home/runner/actions-runner/_work/maxtext/maxtext:/app --rm --privileged maxtext_base_image bash -c \
- 'bash end_to_end/test_generate_param_only_checkpoint.sh -r runner_$(date +%Y-%m-%d-%H-%M)-${RANDOM} -o gs://runner-maxtext-logs -d gs://maxtext-dataset -i 4'
+ 'bash end_to_end/tpu/test_generate_param_only_checkpoint.sh -r runner_$(date +%Y-%m-%d-%H-%M)-${RANDOM} -o gs://runner-maxtext-logs -d gs://maxtext-dataset -i 4'
- name: Test generate_param_only_checkpoint with int8 quantization
run: |
docker run -v /home/runner/actions-runner/_work/maxtext/maxtext:/app --rm --privileged maxtext_base_image bash -c \
- 'bash end_to_end/test_generate_param_only_checkpoint.sh -r runner_$(date +%Y-%m-%d-%H-%M)-${RANDOM} -o gs://runner-maxtext-logs -d gs://maxtext-dataset -i 4 -q int8'
+ 'bash end_to_end/tpu/test_generate_param_only_checkpoint.sh -r runner_$(date +%Y-%m-%d-%H-%M)-${RANDOM} -o gs://runner-maxtext-logs -d gs://maxtext-dataset -i 4 -q int8'
- name: Test grain checkpoint determinism
run: |
docker run -v /home/runner/actions-runner/_work/maxtext/maxtext:/app --rm --privileged maxtext_base_image bash -c \
- 'bash end_to_end/test_checkpointing.sh runner gs://runner-maxtext-logs gs://maxtext-dataset False c4-array_record'
+ 'bash end_to_end/tpu/test_checkpointing.sh runner gs://runner-maxtext-logs gs://maxtext-dataset False c4-array_record'
- name: Test checkpoint compatibility
run: |
docker run -v /home/runner/actions-runner/_work/maxtext/maxtext:/app --rm --privileged maxtext_base_image bash -c \
- 'bash end_to_end/test_checkpoint_compatibility.sh runner gs://runner-maxtext-logs gs://maxtext-dataset'
+ 'bash end_to_end/tpu/test_checkpoint_compatibility.sh runner gs://runner-maxtext-logs gs://maxtext-dataset'
- name: Validate Pedagogical Example, Shmap_collective_matmul
run: |
docker run -v /home/runner/actions-runner/_work/maxtext/maxtext:/app --rm --privileged maxtext_base_image bash -c \
Expand Down
6 changes: 3 additions & 3 deletions MaxText/layers/embeddings.py
Original file line number Diff line number Diff line change
Expand Up @@ -164,8 +164,8 @@ def __call__(
)
position = position[:, :, jnp.newaxis, jnp.newaxis]
sinusoid_inp = position / timescale
- sin = jnp.sin(sinusoid_inp)
- cos = jnp.cos(sinusoid_inp)
+ sin = jnp.sin(sinusoid_inp).astype(inputs.dtype)
+ cos = jnp.cos(sinusoid_inp).astype(inputs.dtype)
first_half, second_half = jnp.split(inputs, 2, axis=-1)
first_part = first_half * cos - second_half * sin
second_part = second_half * cos + first_half * sin
Expand Down Expand Up @@ -198,4 +198,4 @@ def __call__(
signal = jnp.concatenate([jnp.sin(scaled_time), jnp.cos(scaled_time)], axis = -1)
# signal = jnp.pad(signal, [[0, jnp.mod(self.embedding_dims, 2)]])
position_embedding = signal.astype(jnp.float32)
- return input_embedding + position_embedding
+ return input_embedding + position_embedding
1 change: 0 additions & 1 deletion MaxText/tests/train_gpu_smoke_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,6 @@ class Train(unittest.TestCase):

def test_tiny_config(self):
test_tmpdir = os.environ.get("TEST_TMPDIR")
- os.environ["TENSORBOARD_PROJECT"] = "test-project"
train_main([
None,
"third_party/py/maxtext/configs/gpu_smoke_test.yml",
Expand Down
1 change: 0 additions & 1 deletion MaxText/tests/train_int8_smoke_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,6 @@ class Train(unittest.TestCase):

def test_tiny_config(self):
test_tmpdir = os.environ.get("TEST_TMPDIR")
- os.environ["TENSORBOARD_PROJECT"] = "test-project"
train_main([None, "third_party/py/maxtext/configs/base.yml",
f"base_output_directory=gs://runner-maxtext-logs", "run_name=runner_test",
r"dataset_path=gs://maxtext-dataset",
Expand Down
1 change: 0 additions & 1 deletion MaxText/tests/train_smoke_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,6 @@ class Train(unittest.TestCase):

def test_tiny_config(self):
test_tmpdir = os.environ.get("TEST_TMPDIR")
- os.environ["TENSORBOARD_PROJECT"] = "test-project"
train_main([None, "third_party/py/maxtext/configs/base.yml",
f"base_output_directory=gs://runner-maxtext-logs", "run_name=runner_test",
r"dataset_path=gs://maxtext-dataset",
Expand Down
3 changes: 2 additions & 1 deletion MaxText/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -508,7 +508,8 @@ def main(argv: Sequence[str]) -> None:
validate_train_config(config)
os.environ["TFDS_DATA_DIR"] = config.dataset_path
vertex_tensorboard_manager = VertexTensorboardManager()
- vertex_tensorboard_manager.configure_vertex_tensorboard(config)
+ if config.use_vertex_tensorboard or os.environ.get("UPLOAD_DATA_TO_TENSORBOARD"):
+   vertex_tensorboard_manager.configure_vertex_tensorboard(config)

debug_config = debug_configuration.DebugConfig(
stack_trace_config = stack_trace_configuration.StackTraceConfig(
Expand Down
139 changes: 0 additions & 139 deletions end_to_end/eval_assert.py

This file was deleted.

64 changes: 0 additions & 64 deletions end_to_end/gemma/2b/test_gemma.sh

This file was deleted.

31 changes: 0 additions & 31 deletions end_to_end/gemma/7b/1_test_gemma.sh

This file was deleted.

0 comments on commit 9ee125e

Please sign in to comment.