Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

check is streamable #166

Closed
wants to merge 7 commits into from
Closed
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 14 additions & 2 deletions elk/extraction/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,16 @@
  from .balanced_sampler import BalancedSampler, FewShotSampler
- from .extraction import Extract, extract_hiddens, extract
- from .generator import _GeneratorConfig, _GeneratorBuilder
+ from .extraction import Extract, extract, extract_hiddens
+ from .generator import _GeneratorBuilder, _GeneratorConfig
  from .prompt_loading import PromptConfig, yield_prompts
+
+ __all__ = [
+     "_GeneratorBuilder",
+     "_GeneratorConfig",
+     "BalancedSampler",
+     "extract_hiddens",
+     "extract",
+     "Extract",
+     "FewShotSampler",
+     "PromptConfig",
+     "yield_prompts",
+ ]
6 changes: 0 additions & 6 deletions elk/extraction/balanced_sampler.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,12 +9,6 @@
  from ..math_util import stochastic_round_constrained
  from ..utils import infer_label_column
  from ..utils.typing import assert_type
- from collections import deque
- from datasets import IterableDataset, Features
- from itertools import cycle, islice
- from random import Random
- from torch.utils.data import IterableDataset as TorchIterableDataset
- from typing import Iterator, Optional, Iterable


  class BalancedSampler(TorchIterableDataset):
Expand Down
1 change: 0 additions & 1 deletion elk/extraction/extraction.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,6 @@
  import logging
  import os
  from dataclasses import InitVar, dataclass
- from itertools import islice
  from typing import Iterable, Literal, Optional, Union

  import torch
Expand Down
10 changes: 0 additions & 10 deletions elk/extraction/prompt_loading.py
Original file line number Diff line number Diff line change
Expand Up @@ -19,16 +19,6 @@
      select_train_val_splits,
  )
  from .balanced_sampler import FewShotSampler
- from dataclasses import dataclass
- from datasets import (
-     load_dataset,
-     Dataset,
-     Features,
- )
- from datasets.distributed import split_dataset_by_node
- from random import Random
- from simple_parsing.helpers import field, Serializable
- from typing import Any, Iterator, Literal, Optional


  @dataclass
Expand Down
1 change: 1 addition & 0 deletions elk/utils/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@
      "get_columns_all_equal",
      "infer_label_column",
      "infer_num_classes",
+     "is_streamable",
      "float32_to_int16",
      "int16_to_float32",
      "select_train_val_splits",
Expand Down
8 changes: 3 additions & 5 deletions elk/utils/data_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,14 +6,12 @@
      ClassLabel,
      DatasetDict,
      Features,
-     IterableDataset,
      Split,
      Value,
  )
- from random import Random
- from itertools import islice
- from typing import Iterable, List, Any
- import copy
+
+ from ..promptsource.templates import Template
+ from .typing import assert_type


  def get_columns_all_equal(dataset: DatasetDict) -> list[str]:
Expand Down
4 changes: 1 addition & 3 deletions tests/test_load_prompts.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,9 @@
- from elk.extraction import yield_prompts, PromptConfig
- from elk.promptsource.templates import DatasetTemplates
  from itertools import cycle, islice
  from typing import Literal

  import pytest

- from elk.extraction import PromptConfig, load_prompts
+ from elk.extraction import PromptConfig, yield_prompts
  from elk.promptsource.templates import DatasetTemplates


Expand Down