class SelfInstructPipeline:
5
./data_output.json
(6, 2)
None
def __init__( self, agent: ChatAgent, seed: str, num_machine_instructions: int = 5, data_output_path: Optional[str] = './data_output.json', human_to_machine_ratio: tuple = (6, 2), instruction_filter: Optional[InstructionFilter] = None, filter_config: Optional[Dict[str, Dict[str, Any]]] = None, stop_on_first_failure: bool = False ):
def load_seed(self, path: str):
def sample_human_tasks(self, count: int):
def sample_machine_tasks(self, count: int):
def generate_machine_instruction(self):
def identify_instruction(self, instruction: str):
def generate_machine_instances(self):
def generate_machine_instance(self, instruction: str, classification: bool):
def parse_classification_output(self, generated_text: str):
def parse_non_classification_output(self, generated_text: str):
def construct_data(self):
def generate(self, timeout_minutes = 600):
600