package types

import (
	"fmt"
	"os"
)

type AddVoiceResponse struct {
	VoiceID string `json:"voice_id"`
}

type HistoryPost struct {
	HistoryItemIds []string `json:"history_item_ids"`
}
type Voice struct {
	Name        string     `json:"name"`                  // The name that identifies this voice. This will be displayed in the dropdown of the website.
	Files       []*os.File `json:"files,omitempty"`       // Audio files to add to the voice
	Description string     `json:"description,omitempty"` // How would you describe the voice?
	Labels      string     `json:"labels,omitempty"`      // Serialized labels dictionary for the voice.
}
type TTS struct {
	VoiceID       string           `json:"voice_id"` // The ID of the voice that will be used to generate the speech.
	ModelID       string           `json:"model_id,omitempty"`
	Text          string           `json:"text"`                     // The text that will get converted into speech.
	PreviousText  string           `json:"previous_text,omitempty"`  // The text that was used to generate the previous audio file.
	NextText      string           `json:"next_text,omitempty"`      // The text that will be used to generate the next audio file.
	VoiceSettings SynthesisOptions `json:"voice_settings,omitempty"` // Voice settings are applied only on the given TTS request.
	Stream        bool             `json:"stream,omitempty"`         // If true, the response will be a stream of audio data.
}

type TTSParam func(*TTS)

func (so *SynthesisOptions) Clamp() {
	if so.Stability > 1 || so.Stability < 0 {
		so.Stability = 0.75
	}
	if so.SimilarityBoost > 1 || so.SimilarityBoost < 0 {
		so.SimilarityBoost = 0.75
	}
	if so.Style > 1 || so.Style < 0 {
		so.Style = 0.0
	}
	// UseSpeakerBoost defaults to the zero value (false) for bool;
	// no conditional needed as the caller sets it explicitly.
}

type SynthesisOptions struct {
	Stability       float64 `json:"stability"`
	SimilarityBoost float64 `json:"similarity_boost"`
	Style           float64 `json:"style"`
	UseSpeakerBoost bool    `json:"use_speaker_boost"`
}

type SharingOptions struct {
	Status              string            `json:"status"`
	HistoryItemSampleId string            `json:"history_item_sample_id"`
	OriginalVoiceId     string            `json:"original_voice_id"`
	PublicOwnerId       string            `json:"public_owner_id"`
	LikedByCount        int32             `json:"liked_by_count"`
	ClonedByCount       int32             `json:"cloned_by_count"`
	WhitelistedEmails   []string          `json:"whitelisted_emails"`
	Name                string            `json:"name"`
	Labels              map[string]string `json:"labels"`
	Description         string            `json:"description"`
	ReviewStatus        string            `json:"review_status"`
	ReviewMessage       string            `json:"review_message"`
	EnabledInLibrary    bool              `json:"enabled_in_library"`
}

type ExtendedSubscriptionResponseModel struct {
	Tier                           string                  `json:"tier"`
	CharacterCount                 int32                   `json:"character_count"`
	CharacterLimit                 int32                   `json:"character_limit"`
	CanExtendCharacterLimit        bool                    `json:"can_extend_character_limit"`
	AllowedToExtendCharacterLimit  bool                    `json:"allowed_to_extend_character_limit"`
	NextCharacterCountResetUnix    int32                   `json:"next_character_count_reset_unix"`
	VoiceLimit                     int32                   `json:"voice_limit"`
	ProfessionalVoiceLimit         int32                   `json:"professional_voice_limit"`
	CanExtendVoiceLimit            bool                    `json:"can_extend_voice_limit"`
	CanUseInstantVoiceCloning      bool                    `json:"can_use_instant_voice_cloning"`
	CanUseProfessionalVoiceCloning bool                    `json:"can_use_professional_voice_cloning"`
	AvailableModels                []TtsModelResponseModel `json:"available_models"`
	CanUseDelayedPaymentMethods    bool                    `json:"can_use_delayed_payment_methods"`
	Currency                       string                  `json:"currency"`
	Status                         string                  `json:"status"`
	NextInvoice                    Invoice                 `json:"next_invoice"`
}
type FeedbackResponseModel struct {
	ThumbsUp        bool   `json:"thumbs_up"`
	Feedback        string `json:"feedback"`
	Emotions        bool   `json:"emotions"`
	InaccurateClone bool   `json:"inaccurate_clone"`
	Glitches        bool   `json:"glitches"`
	AudioQuality    bool   `json:"audio_quality"`
	Other           bool   `json:"other"`
	ReviewStatus    string `json:"review_status,omitempty"`
}
type FineTuningResponseModel struct {
	ModelID                   string                             `json:"model_id"`
	IsAllowedToFineTune       bool                               `json:"is_allowed_to_fine_tune"`
	FineTuningRequested       bool                               `json:"fine_tuning_requested"`
	FinetuningState           string                             `json:"finetuning_state"`
	VerificationAttempts      []VerificationAttemptResponseModel `json:"verification_attempts"`
	VerificationFailures      []string                           `json:"verification_failures"`
	VerificationAttemptsCount int32                              `json:"verification_attempts_count"`
	SliceIds                  []string                           `json:"slice_ids"`
}
type GetHistoryResponse struct {
	History []HistoryItemList `json:"history"`
}
type GetVoicesResponseModel struct {
	Voices []VoiceResponseModel `json:"voices"`
}
type HistoryItemList struct {
	HistoryItemID            string                 `json:"history_item_id"`
	RequestID                string                 `json:"request_id"`
	VoiceID                  string                 `json:"voice_id"`
	VoiceName                string                 `json:"voice_name"`
	Text                     string                 `json:"text"`
	DateUnix                 int32                  `json:"date_unix"`
	CharacterCountChangeFrom int32                  `json:"character_count_change_from"`
	CharacterCountChangeTo   int32                  `json:"character_count_change_to"`
	ContentType              string                 `json:"content_type"`
	State                    string                 `json:"state"`
	Settings                 *interface{}           `json:"settings"`
	Feedback                 *FeedbackResponseModel `json:"feedback"`
}
type Invoice struct {
	AmountDueCents         int32 `json:"amount_due_cents"`
	NextPaymentAttemptUnix int32 `json:"next_payment_attempt_unix"`
}
type LanguageResponseModel struct {
	IsoCode     string `json:"iso_code"`
	DisplayName string `json:"display_name"`
}

type Language struct {
	LanguageID string `json:"language_id"`
	Name       string `json:"name"`
}

type ModelResponseModel struct {
	ModelID              string     `json:"model_id"`
	Name                 string     `json:"name"`
	Description          string     `json:"description"`
	CanBeFinetuned       bool       `json:"can_be_finetuned"`
	CanDoTextToSpeech    bool       `json:"can_do_text_to_speech"`
	CanDoVoiceConversion bool       `json:"can_do_voice_conversion"`
	TokenCostFactor      float64    `json:"token_cost_factor"`
	Languages            []Language `json:"languages"`
}
type RecordingResponseModel struct {
	RecordingID    string `json:"recording_id"`
	MimeType       string `json:"mime_type"`
	SizeBytes      int32  `json:"size_bytes"`
	UploadDateUnix int32  `json:"upload_date_unix"`
	Transcription  string `json:"transcription"`
}
type Sample struct {
	SampleID  string `json:"sample_id"`
	FileName  string `json:"file_name"`
	MimeType  string `json:"mime_type"`
	SizeBytes int32  `json:"size_bytes"`
	Hash      string `json:"hash"`
}

type Subscription struct {
	Tier                           string                  `json:"tier"`
	CharacterCount                 int32                   `json:"character_count"`
	CharacterLimit                 int32                   `json:"character_limit"`
	CanExtendCharacterLimit        bool                    `json:"can_extend_character_limit"`
	AllowedToExtendCharacterLimit  bool                    `json:"allowed_to_extend_character_limit"`
	NextCharacterCountResetUnix    int32                   `json:"next_character_count_reset_unix"`
	VoiceLimit                     int32                   `json:"voice_limit"`
	ProfessionalVoiceLimit         int32                   `json:"professional_voice_limit"`
	CanExtendVoiceLimit            bool                    `json:"can_extend_voice_limit"`
	CanUseInstantVoiceCloning      bool                    `json:"can_use_instant_voice_cloning"`
	CanUseProfessionalVoiceCloning bool                    `json:"can_use_professional_voice_cloning"`
	AvailableModels                []TtsModelResponseModel `json:"available_models"`
	CanUseDelayedPaymentMethods    bool                    `json:"can_use_delayed_payment_methods"`
	Currency                       string                  `json:"currency"`
	Status                         string                  `json:"status"`
}
type TtsModelResponseModel struct {
	ModelID           string                  `json:"model_id"`
	DisplayName       string                  `json:"display_name"`
	SupportedLanguage []LanguageResponseModel `json:"supported_language"`
}
type UserResponseModel struct {
	Subscription Subscription `json:"subscription"`
	IsNewUser    bool         `json:"is_new_user"`
	XiAPIKey     string       `json:"xi_api_key"`
}
type ValidationError struct {
	Loc   any    `json:"loc"`
	Msg   string `json:"msg"`
	Type_ string `json:"type"`
}

func (ve ValidationError) Error() string {
	return fmt.Sprintf("%s %s: ", ve.Type_, ve.Msg)
}

type ParamError struct {
	Detail struct {
		Status  string `json:"status"`
		Message string `json:"message"`
	} `json:"detail"`
}

func (pe ParamError) Error() string {
	return fmt.Sprintf("%s %s: ", pe.Detail.Status, pe.Detail.Message)
}

type VerificationAttemptResponseModel struct {
	Text                string                  `json:"text"`
	DateUnix            int32                   `json:"date_unix"`
	Accepted            bool                    `json:"accepted"`
	Similarity          float64                 `json:"similarity"`
	LevenshteinDistance float64                 `json:"levenshtein_distance"`
	Recording           *RecordingResponseModel `json:"recording"`
}
type VoiceResponseModel struct {
	VoiceID                 string                  `json:"voice_id"`
	Name                    string                  `json:"name"`
	Samples                 []Sample                `json:"samples"`
	Category                string                  `json:"category"`
	FineTuning              FineTuningResponseModel `json:"fine_tuning"`
	Labels                  map[string]string       `json:"labels"`
	Description             string                  `json:"description"`
	PreviewURL              string                  `json:"preview_url"`
	AvailableForTiers       []string                `json:"available_for_tiers"`
	Settings                SynthesisOptions        `json:"settings"`
	Sharing                 SharingOptions          `json:"sharing"`
	HighQualityBaseModelIds []string                `json:"high_quality_base_model_ids"`
}

type SoundGeneration struct {
	Text            string  `json:"text"`             // The text that will get converted into a sound effect.
	DurationSeconds float64 `json:"duration_seconds"` // The duration of the sound which will be generated in seconds.
	PromptInfluence float64 `json:"prompt_influence"` // A higher prompt influence makes your generation follow the prompt more closely.
}

type TimestampsGranularity string

const (
	// TimestampsGranularityNone represents no timestamps
	TimestampsGranularityNone TimestampsGranularity = "none"
	// TimestampsGranularityWord represents word-level timestamps
	TimestampsGranularityWord TimestampsGranularity = "word"
	// TimestampsGranularityCharacter represents character-level timestamps
	TimestampsGranularityCharacter TimestampsGranularity = "character"
)

type SpeechToTextModel string

const (
	SpeechToTextModelScribeV1 SpeechToTextModel = "scribe_v1"
)

// SpeechToTextRequest represents a request to the speech-to-text API
type SpeechToTextRequest struct {
	// The ID of the model to use for transcription (currently only 'scribe_v1')
	ModelID SpeechToTextModel `json:"model_id"`
	// ISO-639-1 or ISO-639-3 language code. If not specified, language is auto-detected
	LanguageCode string `json:"language_code,omitempty"`
	// Whether to tag audio events like (laughter), (footsteps), etc.
	TagAudioEvents bool `json:"tag_audio_events,omitempty"`
	// Number of speakers (1-32). If not specified, uses model's maximum supported
	NumSpeakers int `json:"num_speakers,omitempty"`
	// Granularity of timestamps: "none", "word", or "character"
	TimestampsGranularity TimestampsGranularity `json:"timestamps_granularity,omitempty"`
	// Whether to annotate speaker changes (limits input to 8 minutes)
	Diarize bool `json:"diarize,omitempty"`
}

// SpeechToTextResponse represents the response from the speech-to-text API
type SpeechToTextResponse struct {
	// ISO-639-1 language code
	LanguageCode string `json:"language_code"`
	// The probability of the detected language
	LanguageProbability float64 `json:"language_probability"`
	// The transcribed text
	Text string `json:"text"`
	// Detailed word-level information
	Words []TranscriptionWord `json:"words"`
	// Error message, if any
	Error string `json:"error,omitempty"`
}

// TranscriptionWord represents a word or spacing in the transcription
type TranscriptionWord struct {
	// The text content of the word/spacing
	Text string `json:"text"`
	// Type of segment ("word" or "spacing")
	Type string `json:"type"`
	// Start time in seconds
	Start float64 `json:"start"`
	// End time in seconds
	End float64 `json:"end"`
	// Speaker identifier for multi-speaker transcriptions
	SpeakerID string `json:"speaker_id,omitempty"`
	// Character-level information
	Characters []TranscriptionCharacter `json:"characters,omitempty"`
}

// TranscriptionCharacter represents character-level information in the transcription
type TranscriptionCharacter struct {
	// The text content of the character
	Text string `json:"text"`
	// Start time in seconds
	Start float64 `json:"start"`
	// End time in seconds
	End float64 `json:"end"`
}