diff --git a/packages/inference/src/HfInference.ts b/packages/inference/src/HfInference.ts
index 6cc268cf29..401abefc5f 100644
--- a/packages/inference/src/HfInference.ts
+++ b/packages/inference/src/HfInference.ts
@@ -5,7 +5,7 @@ import type { DistributiveOmit } from "./utils/distributive-omit";
 /* eslint-disable @typescript-eslint/no-empty-interface */
 /* eslint-disable @typescript-eslint/no-unsafe-declaration-merging */
 
-type Task = typeof tasks;
+type Task = Omit<typeof tasks, "request" | "streamingRequest">;
 
 type TaskWithNoAccessToken = {
 	[key in keyof Task]: (
@@ -21,22 +21,83 @@ type TaskWithNoAccessTokenNoEndpointUrl = {
 	) => ReturnType<Task[key]>;
 };
 
-export class HfInference {
-	private readonly accessToken: string;
-	private readonly defaultOptions: Options;
+export class HfInference implements Task {
+	protected readonly accessToken: string;
+	protected readonly defaultOptions: Options;
+
+	speechToText: typeof tasks.speechToText;
+	audioClassification: typeof tasks.audioClassification;
+	automaticSpeechRecognition: typeof tasks.automaticSpeechRecognition;
+	textToSpeech: typeof tasks.textToSpeech;
+	audioToAudio: typeof tasks.audioToAudio;
+	imageClassification: typeof tasks.imageClassification;
+	imageSegmentation: typeof tasks.imageSegmentation;
+	imageToText: typeof tasks.imageToText;
+	objectDetection: typeof tasks.objectDetection;
+	textToImage: typeof tasks.textToImage;
+	imageToImage: typeof tasks.imageToImage;
+	zeroShotImageClassification: typeof tasks.zeroShotImageClassification;
+	featureExtraction: typeof tasks.featureExtraction;
+	fillMask: typeof tasks.fillMask;
+	questionAnswering: typeof tasks.questionAnswering;
+	sentenceSimilarity: typeof tasks.sentenceSimilarity;
+	summarization: typeof tasks.summarization;
+	tableQuestionAnswering: typeof tasks.tableQuestionAnswering;
+	textClassification: typeof tasks.textClassification;
+	textGeneration: typeof tasks.textGeneration;
+	tokenClassification: typeof tasks.tokenClassification;
+	translation: typeof tasks.translation;
+	zeroShotClassification: typeof tasks.zeroShotClassification;
+	chatCompletion: typeof tasks.chatCompletion;
+	documentQuestionAnswering: typeof tasks.documentQuestionAnswering;
+	visualQuestionAnswering: typeof tasks.visualQuestionAnswering;
+	tabularRegression: typeof tasks.tabularRegression;
+	tabularClassification: typeof tasks.tabularClassification;
+	textGenerationStream: typeof tasks.textGenerationStream;
+	chatCompletionStream: typeof tasks.chatCompletionStream;
+
+	static mapInferenceFn<TArgs, TOut>(instance: HfInference, func: (...args: [TArgs, Options?]) => TOut) {
+		return function (...[args, options]: Parameters<(...args: [TArgs, Options?]) => TOut>): TOut {
+			return func({ ...args, accessToken: instance.accessToken }, { ...instance.defaultOptions, ...(options ?? {}) });
+		};
+	}
 
 	constructor(accessToken = "", defaultOptions: Options = {}) {
 		this.accessToken = accessToken;
 		this.defaultOptions = defaultOptions;
 
-		for (const [name, fn] of Object.entries(tasks)) {
-			Object.defineProperty(this, name, {
-				enumerable: false,
-				value: (params: RequestArgs, options: Options) =>
-					// eslint-disable-next-line @typescript-eslint/no-explicit-any
-					fn({ ...params, accessToken } as any, { ...defaultOptions, ...options }),
-			});
-		}
+		this.speechToText = HfInference.mapInferenceFn(this, tasks.speechToText);
+		this.audioClassification = HfInference.mapInferenceFn(this, tasks.audioClassification);
+		this.automaticSpeechRecognition = HfInference.mapInferenceFn(this, tasks.automaticSpeechRecognition);
+		this.textToSpeech = HfInference.mapInferenceFn(this, tasks.textToSpeech);
+		this.audioToAudio = HfInference.mapInferenceFn(this, tasks.audioToAudio);
+		this.imageClassification = HfInference.mapInferenceFn(this, tasks.imageClassification);
+		this.imageSegmentation = HfInference.mapInferenceFn(this, tasks.imageSegmentation);
+		this.imageToText = HfInference.mapInferenceFn(this, tasks.imageToText);
+		this.objectDetection = HfInference.mapInferenceFn(this, tasks.objectDetection);
+		this.textToImage = HfInference.mapInferenceFn(this, tasks.textToImage);
+		this.imageToImage = HfInference.mapInferenceFn(this, tasks.imageToImage);
+		this.zeroShotImageClassification = HfInference.mapInferenceFn(this, tasks.zeroShotImageClassification);
+		this.featureExtraction = HfInference.mapInferenceFn(this, tasks.featureExtraction);
+		this.fillMask = HfInference.mapInferenceFn(this, tasks.fillMask);
+		this.questionAnswering = HfInference.mapInferenceFn(this, tasks.questionAnswering);
+		this.sentenceSimilarity = HfInference.mapInferenceFn(this, tasks.sentenceSimilarity);
+		this.summarization = HfInference.mapInferenceFn(this, tasks.summarization);
+		this.tableQuestionAnswering = HfInference.mapInferenceFn(this, tasks.tableQuestionAnswering);
+		this.textClassification = HfInference.mapInferenceFn(this, tasks.textClassification);
+		this.textGeneration = HfInference.mapInferenceFn(this, tasks.textGeneration);
+		this.tokenClassification = HfInference.mapInferenceFn(this, tasks.tokenClassification);
+		this.translation = HfInference.mapInferenceFn(this, tasks.translation);
+		this.zeroShotClassification = HfInference.mapInferenceFn(this, tasks.zeroShotClassification);
+		this.chatCompletion = HfInference.mapInferenceFn(this, tasks.chatCompletion);
+		this.documentQuestionAnswering = HfInference.mapInferenceFn(this, tasks.documentQuestionAnswering);
+		this.visualQuestionAnswering = HfInference.mapInferenceFn(this, tasks.visualQuestionAnswering);
+		this.tabularRegression = HfInference.mapInferenceFn(this, tasks.tabularRegression);
+		this.tabularClassification = HfInference.mapInferenceFn(this, tasks.tabularClassification);
+
+		/// Streaming methods
+		this.textGenerationStream = HfInference.mapInferenceFn(this, tasks.textGenerationStream);
+		this.chatCompletionStream = HfInference.mapInferenceFn(this, tasks.chatCompletionStream);
 	}
 
 	/**
diff --git a/packages/inference/src/tasks/index.ts b/packages/inference/src/tasks/index.ts
index ba3108446c..2b91f72949 100644
--- a/packages/inference/src/tasks/index.ts
+++ b/packages/inference/src/tasks/index.ts
@@ -1,3 +1,5 @@
+import { automaticSpeechRecognition } from "./audio/automaticSpeechRecognition";
+
 // Custom tasks with arbitrary inputs and outputs
 export * from "./custom/request";
 export * from "./custom/streamingRequest";
@@ -40,3 +42,5 @@ export * from "./multimodal/visualQuestionAnswering";
"./multimodal/visualQuestionAnswering"; // Tabular tasks export * from "./tabular/tabularRegression"; export * from "./tabular/tabularClassification"; + +export const speechToText = automaticSpeechRecognition; diff --git a/packages/inference/test/HfInference.spec.ts b/packages/inference/test/HfInference.spec.ts index d2db78fd4c..84e12ee8b8 100644 --- a/packages/inference/test/HfInference.spec.ts +++ b/packages/inference/test/HfInference.spec.ts @@ -589,18 +589,18 @@ describe.concurrent("HfInference", () => { generated_text: "a large brown and white giraffe standing in a field ", }); }); - it("request - openai-community/gpt2", async () => { - expect( - await hf.request({ - model: "openai-community/gpt2", - inputs: "one plus two equals", - }) - ).toMatchObject([ - { - generated_text: expect.any(String), - }, - ]); - }); + // it("request - openai-community/gpt2", async () => { + // expect( + // await hf.request({ + // model: "openai-community/gpt2", + // inputs: "one plus two equals", + // }) + // ).toMatchObject([ + // { + // generated_text: expect.any(String), + // }, + // ]); + // }); // Skipped at the moment because takes forever it.skip("tabularRegression", async () => {